diff --git "a/openvino_model.xml" "b/openvino_model.xml" new file mode 100644--- /dev/null +++ "b/openvino_model.xml" @@ -0,0 +1,186959 @@ +<?xml version="1.0"?> +<net name="Model0" version="11"> + <layers> + <layer id="3" name="input_ids" type="Parameter" version="opset1"> + <data shape="?,?" element_type="i64" /> + <output> + <port id="0" precision="I64" names="input_ids"> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="2" name="attention_mask" type="Parameter" version="opset1"> + <data shape="?,?" element_type="i64" /> + <output> + <port id="0" precision="I64" names="attention_mask"> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="1" name="position_ids" type="Parameter" version="opset1"> + <data shape="?,?" element_type="i64" /> + <output> + <port id="0" precision="I64" names="position_ids"> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="0" name="beam_idx" type="Parameter" version="opset1"> + <data shape="?" element_type="i32" /> + <output> + <port id="0" precision="I32" names="beam_idx"> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="4" name="Constant_340762" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="5" name="ShapeOf_340748" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="I64"> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6" name="Constant_340750" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7" name="Constant_340752" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="8" name="Gather_340753" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9" name="Constant_340755" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10" name="Constant_340757" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11" name="Constant_340759" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="12" name="Concat_340760" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="13" name="Broadcast_340763" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="14" name="ReadValue_333266" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.9.valuepresent.9.value" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.9.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="15" name="Constant_325366" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="16" name="Gather_325367" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="17" name="Constant_290141" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="28" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="18" name="self.model.embed_tokens.weight" type="Const" version="opset1"> + <data element_type="u8" shape="152064, 5120" offset="20508" size="778567680" /> + <output> + <port id="0" precision="U8"> + <dim>152064</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="19" name="Convert_384568" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>152064</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>152064</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="20" name="self.model.embed_tokens.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="152064, 1" offset="778588188" size="152064" /> + <output> + <port id="0" precision="U8"> + <dim>152064</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="21" name="Convert_384571" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>152064</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>152064</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="22" name="self.model.embed_tokens.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>152064</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP16"> + <dim>152064</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>152064</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="23" name="self.model.embed_tokens.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="152064, 1" offset="778740252" size="304128" /> + <output> + <port id="0" precision="FP16"> + <dim>152064</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="24" name="self.model.embed_tokens.weight/fq_weights_0" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>152064</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP16"> + <dim>152064</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>152064</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="25" name="__module.model.embed_tokens/prim::PythonOp/Convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>152064</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>152064</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="26" name="__module.model.embed_tokens/prim::PythonOp/Convert_1" type="Convert" version="opset1"> + <data destination_type="i32" /> + <input> + <port id="0" precision="I64"> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="27" name="__module.model.embed_tokens/prim::PythonOp/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="28" name="__module.model.embed_tokens/prim::PythonOp/Gather" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>152064</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="449,529,540,hidden_states.1,inputs_embeds"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="29" name="Constant_290050" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="779044380" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="30" name="Constant_290049" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="31" name="Constant_290047" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="32" name="__module.model.layers.0.input_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="530"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="33" name="Constant_520" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="531"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="34" name="__module.model.layers.0.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="532,variance.1"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="35" name="Constant_290048" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="36" name="__module.model.layers.0.input_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="533"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="37" name="__module.model.layers.0.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="38" name="__module.model.layers.0.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="534"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="39" name="__module.model.layers.0.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="535,536,hidden_states.3,hidden_states.5"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="40" name="__module.model.layers.0.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="537,539,hidden_states.7"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="41" name="self.model.layers.0.self_attn.q_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="779064880" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="42" name="Convert_386027" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="43" name="self.model.layers.0.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="792172080" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="44" name="Convert_386029" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="45" name="self.model.layers.0.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="46" name="self.model.layers.0.self_attn.q_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="792274480" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="47" name="self.model.layers.0.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="48" name="Constant_386034" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="49" name="Reshape_386035" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="50" name="__module.model.layers.0.self_attn.q_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="51" name="__module.model.layers.0.self_attn.q_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="52" name="self.model.layers.0.self_attn.q_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="5120" offset="792684096" size="10240" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.0.self_attn.q_proj.bias"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="53" name="__module.model.layers.0.self_attn.q_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="54" name="__module.model.layers.0.self_attn.q_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="549,query_states.1"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="55" name="Constant_301697" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="792694336" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="56" name="__module.model.layers.0.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="557"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="57" name="__module.model.layers.0.self_attn/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="58" name="__module.model.layers.0.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="558,q.1"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="59" name="__module.model.rotary_emb/aten::to/Convert" type="Const" version="opset1"> + <data element_type="f32" shape="1, 64, 1" offset="792694384" size="256" /> + <output> + <port id="0" precision="FP32" names="501"> + <dim>1</dim> + <dim>64</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="60" name="ShapeOf_297528" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="I64"> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="61" name="Constant_297529" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="62" name="Constant_297530" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="63" name="Gather_297531" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="502"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="64" name="Constant_267815" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="65" name="Constant_267817" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="66" name="__module.model.rotary_emb/prim::ListConstruct/Concat" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="3" precision="I64" names="503"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="67" name="__module.model.rotary_emb/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>64</dim> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="504,509,inv_freq_expanded,inv_freq_expanded.1"> + <dim>-1</dim> + <dim>64</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="68" name="343" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64" names="343" /> + </output> + </layer> + <layer id="69" name="__module.model.rotary_emb/aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="I64"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="506,507"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="70" name="__module.model.rotary_emb/aten::to/Convert_2" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="I64"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="508,510,position_ids_expanded,position_ids_expanded.1"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="71" name="__module.model.rotary_emb/aten::matmul/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>64</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="511"> + <dim>-1</dim> + <dim>64</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="72" name="__module.model.rotary_emb/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="3" offset="792694648" size="12" /> + <output> + <port id="0" precision="I32"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="73" name="__module.model.rotary_emb/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>64</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I32"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="512"> + <dim>-1</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="74" name="__module.model.rotary_emb/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="514,emb"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="75" name="__module.model.rotary_emb/aten::cos/Cos" type="Cos" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="515,517,519,522,cos.1,cos.3,cos.5"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="76" name="__module.model.layers.0.self_attn/aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="1039,1196,1353,1510,1667,1824,1981,2138,2295,2452,2609,2766,2923,3080,3237,3394,3551,3708,3865,4022,4179,4336,4493,4650,4807,4964,5121,5278,5435,5592,565,5749,5906,6063,6220,6377,6534,6691,6848,7005,7162,725,7319,7476,7633,7790,7947,882,cos,cos.11,cos.13,cos.15,cos.17,cos.19,cos.21,cos.23,cos.25,cos.27,cos.29,cos.31,cos.33,cos.35,cos.37,cos.39,cos.41,cos.43,cos.45,cos.47,cos.49,cos.51,cos.53,cos.55,cos.57,cos.59,cos.61,cos.63,cos.65,cos.67,cos.69,cos.7,cos.71,cos.73,cos.75,cos.77,cos.79,cos.81,cos.83,cos.85,cos.87,cos.89,cos.9,cos.91,cos.93,cos.95,cos.97,cos.99"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="77" name="__module.model.layers.0.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="567"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="78" name="__module.model.layers.0.self_attn/aten::size/ShapeOf_3" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="79" name="334" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64" names="334" /> + </output> + </layer> + <layer id="80" name="__module.model.layers.0.self_attn/aten::size/Constant_3" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="81" name="__module.model.layers.0.self_attn/aten::size/Gather_3" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="568,573" /> + </output> + </layer> + <layer id="82" name="Constant_65" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64" names="328" /> + </output> + </layer> + <layer id="83" name="__module.model.layers.0.self_attn/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="84" name="__module.model.layers.0.self_attn/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="570,571,575,576" /> + </output> + </layer> + <layer id="85" name="Constant_220537" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="86" name="__module.model.layers.0.self_attn/aten::slice/Reshape_5" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="87" name="__module.model.layers.0.self_attn/aten::slice/Reshape_1" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="88" name="__module.model.layers.0.self_attn/aten::slice/Reshape_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="89" name="__module.model.layers.0.self_attn/aten::slice/Reshape_3" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="90" name="__module.model.layers.0.self_attn/aten::slice/Slice" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="577,x2.1"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="91" name="Constant_290051" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="92" name="__module.model.layers.0.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="578"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="93" name="__module.model.layers.0.self_attn/aten::slice/Reshape_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="94" name="__module.model.layers.0.self_attn/aten::slice/Reshape_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="95" name="__module.model.layers.0.self_attn/aten::slice/Reshape_7" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="96" name="__module.model.layers.0.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="572"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="97" name="__module.model.layers.0.self_attn/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="580"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="98" name="__module.model.rotary_emb/aten::sin/Sin" type="Sin" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="516,518,520,523,sin.1,sin.3,sin.5"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="99" name="__module.model.layers.0.self_attn/aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="1040,1197,1354,1511,1668,1825,1982,2139,2296,2453,2610,2767,2924,3081,3238,3395,3552,3709,3866,4023,4180,4337,4494,4651,4808,4965,5122,5279,5436,5593,566,5750,5907,6064,6221,6378,6535,6692,6849,7006,7163,726,7320,7477,7634,7791,7948,883,sin,sin.11,sin.13,sin.15,sin.17,sin.19,sin.21,sin.23,sin.25,sin.27,sin.29,sin.31,sin.33,sin.35,sin.37,sin.39,sin.41,sin.43,sin.45,sin.47,sin.49,sin.51,sin.53,sin.55,sin.57,sin.59,sin.61,sin.63,sin.65,sin.67,sin.69,sin.7,sin.71,sin.73,sin.75,sin.77,sin.79,sin.81,sin.83,sin.85,sin.87,sin.89,sin.9,sin.91,sin.93,sin.95,sin.97,sin.99"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="100" name="__module.model.layers.0.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="581"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="101" name="__module.model.layers.0.self_attn/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="582"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="102" name="Constant_340775" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="103" name="Constant_340768" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="104" name="Constant_340770" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="105" name="Constant_340772" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="106" name="Concat_340773" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="107" name="Broadcast_340776" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="108" name="ReadValue_333076" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.0.keypresent.0.key" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.0.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="109" name="Constant_325309" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="110" name="Gather_325310" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="111" name="self.model.layers.0.self_attn.k_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="792694688" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="112" name="Convert_386987" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="113" name="self.model.layers.0.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="795316128" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="114" name="Convert_386989" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="115" name="self.model.layers.0.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="116" name="self.model.layers.0.self_attn.k_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="795336608" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="117" name="self.model.layers.0.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="118" name="Constant_386994" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="119" name="Reshape_386995" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="120" name="__module.model.layers.0.self_attn.k_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="121" name="__module.model.layers.0.self_attn.k_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="122" name="self.model.layers.0.self_attn.k_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="795418544" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.0.self_attn.k_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="123" name="__module.model.layers.0.self_attn.k_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="124" name="__module.model.layers.0.self_attn.k_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="552,key_states.3"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="125" name="Constant_301698" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="126" name="__module.model.layers.0.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="560"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="127" name="__module.model.layers.0.self_attn/aten::transpose/ScatterElementsUpdate_1" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="128" name="__module.model.layers.0.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="561,k.1"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="129" name="__module.model.layers.0.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="583"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="130" name="__module.model.layers.0.self_attn/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="131" name="__module.model.layers.0.self_attn/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="132" name="__module.model.layers.0.self_attn/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="584,589" /> + </output> + </layer> + <layer id="133" name="__module.model.layers.0.self_attn/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="134" name="__module.model.layers.0.self_attn/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="586,587,591,592" /> + </output> + </layer> + <layer id="135" name="Constant_220539" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="136" name="__module.model.layers.0.self_attn/aten::slice/Reshape_13" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="137" name="__module.model.layers.0.self_attn/aten::slice/Reshape_9" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="138" name="__module.model.layers.0.self_attn/aten::slice/Reshape_10" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="139" name="__module.model.layers.0.self_attn/aten::slice/Reshape_11" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="140" name="__module.model.layers.0.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="593,x2.3"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="141" name="Constant_290052" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="142" name="__module.model.layers.0.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="594"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="143" name="__module.model.layers.0.self_attn/aten::slice/Reshape_12" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="144" name="__module.model.layers.0.self_attn/aten::slice/Reshape_14" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="145" name="__module.model.layers.0.self_attn/aten::slice/Reshape_15" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="146" name="__module.model.layers.0.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="588"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="147" name="__module.model.layers.0.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="596"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="148" name="__module.model.layers.0.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="597"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="149" name="__module.model.layers.0.self_attn/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="598,key_states.5"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="150" name="__module.model.layers.0.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.0.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="151" name="345" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64" names="345" /> + </output> + </layer> + <layer id="152" name="__module.model.layers.0.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="613,614,615"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="153" name="ShapeOf_297561" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="154" name="Constant_297572" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="155" name="Constant_297573" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="156" name="Gather_297574" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="606"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="157" name="__module.model.layers.0.self_attn/aten::size/ShapeOf_6" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="158" name="Constant_302082" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="159" name="__module.model.layers.0.self_attn/aten::size/Constant_7" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="160" name="__module.model.layers.0.self_attn/aten::size/Gather_7" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="607"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="161" name="Constant_267824" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="162" name="Constant_276191" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="163" name="Constant_276192" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="164" name="Gather_276193" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="165" name="__module.model.layers.0.self_attn/prim::ListConstruct/Concat_2" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="616"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="166" name="__module.model.layers.0.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="617,hidden_states.11"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="167" name="Constant_301699" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="168" name="__module.model.layers.0.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="621,key_states.7"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="169" name="Constant_340788" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="170" name="Constant_340781" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="171" name="Constant_340783" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="172" name="Constant_340785" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="173" name="Concat_340786" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="174" name="Broadcast_340789" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="175" name="ReadValue_333078" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.0.valuepresent.0.value" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.0.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="176" name="Constant_325312" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="177" name="Gather_325313" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="178" name="self.model.layers.0.self_attn.v_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="795420680" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="179" name="Convert_386997" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="180" name="self.model.layers.0.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="798042120" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="181" name="Convert_386999" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="182" name="self.model.layers.0.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="183" name="self.model.layers.0.self_attn.v_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="798062600" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="184" name="self.model.layers.0.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="185" name="Constant_387004" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="186" name="Reshape_387005" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="187" name="__module.model.layers.0.self_attn.v_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="188" name="__module.model.layers.0.self_attn.v_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="189" name="self.model.layers.0.self_attn.v_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="798144520" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.0.self_attn.v_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="190" name="__module.model.layers.0.self_attn.v_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="191" name="__module.model.layers.0.self_attn.v_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="555,value_states.1"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="192" name="Constant_301700" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="193" name="__module.model.layers.0.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="563"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="194" name="__module.model.layers.0.self_attn/aten::transpose/ScatterElementsUpdate_2" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="195" name="__module.model.layers.0.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="564"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="196" name="__module.model.layers.0.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.0.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="197" name="__module.model.layers.0.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="629,630,631"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="198" name="ShapeOf_297533" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="199" name="Constant_297567" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="200" name="Constant_297568" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="201" name="Gather_297569" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="1093,1250,1407,1564,1721,1878,2035,2192,2349,2506,2663,2820,2977,3134,3291,3448,3605,3762,3919,4076,4233,4390,4547,4704,472,4861,5018,5175,5332,5489,5646,5803,5960,6117,622,6274,6431,6588,6745,6902,7059,7216,7373,7530,7687,779,7844,8001,936"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="202" name="__module.model.layers.0.self_attn/aten::size/ShapeOf_10" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="203" name="Constant_302085" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="204" name="__module.model.layers.0.self_attn/aten::size/Constant_11" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="205" name="__module.model.layers.0.self_attn/aten::size/Gather_11" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="623"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="206" name="Constant_267842" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="207" name="Constant_276201" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="208" name="Constant_276202" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="209" name="Gather_276203" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="210" name="__module.model.layers.0.self_attn/prim::ListConstruct/Concat_5" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="632"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="211" name="__module.model.layers.0.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="633,hidden_states.15"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="212" name="Constant_301701" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="213" name="__module.model.layers.0.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="637"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="214" name="__module.model/aten::triu/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="215" name="Multiply_282375" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="798146568" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="216" name="Constant_282380" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="798146572" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="217" name="Constant_297534" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="218" name="Constant_297535" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="219" name="Gather_297536" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="452,457" /> + </output> + </layer> + <layer id="220" name="Constant_297538" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="221" name="Reshape_297539" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="222" name="ShapeOf_297541" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="I64"> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="223" name="Constant_297542" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="224" name="Constant_297543" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="225" name="Gather_297544" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="458,476" /> + </output> + </layer> + <layer id="226" name="Constant_297546" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="227" name="Reshape_297547" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="228" name="__module.model/prim::ListConstruct/Concat" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="459"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="229" name="Maximum_282381" type="Maximum" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="230" name="__module.model/aten::mul/Multiply" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="461"> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="231" name="ShapeOf_297549" type="ShapeOf" version="opset3"> + <data output_type="i32" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="I32"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="232" name="Constant_297550" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="233" name="Constant_297551" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="234" name="Gather_297552" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I32"> + <dim>2</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I32" /> + </output> + </layer> + <layer id="235" name="__module.model/aten::triu/Constant_2" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="798146588" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="236" name="__module.model/aten::triu/Range" type="Range" version="opset4"> + <data output_type="i32" /> + <input> + <port id="0" precision="I32" /> + <port id="1" precision="I32" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I32"> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="237" name="__module.model/aten::triu/Unsqueeze" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="I32"> + <dim>-1</dim> + </port> + <port id="1" precision="I32" /> + </input> + <output> + <port id="2" precision="I32"> + <dim>1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="238" name="__module.model/aten::triu/Convert" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="798146588" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="239" name="Constant_297556" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="240" name="Constant_297557" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="241" name="Gather_297558" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I32"> + <dim>2</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I32" /> + </output> + </layer> + <layer id="242" name="__module.model/aten::triu/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I32" /> + <port id="1" precision="I32" /> + </input> + <output> + <port id="2" precision="I32" /> + </output> + </layer> + <layer id="243" name="__module.model/aten::triu/Range_1" type="Range" version="opset4"> + <data output_type="i32" /> + <input> + <port id="0" precision="I32" /> + <port id="1" precision="I32" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I32"> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="244" name="__module.model/aten::triu/Unsqueeze_1" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="I32"> + <dim>-1</dim> + </port> + <port id="1" precision="I32" /> + </input> + <output> + <port id="2" precision="I32"> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="245" name="__module.model/aten::triu/GreaterEqual" type="GreaterEqual" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I32"> + <dim>1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="BOOL"> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="246" name="__module.model/aten::triu/ConvertLike" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="247" name="__module.model/aten::triu/Select" type="Select" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="BOOL"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="2" precision="FP32" /> + </input> + <output> + <port id="3" precision="FP32" names="462_1"> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="248" name="__module.model/aten::arange/Constant" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="249" name="__module.model/aten::arange/Constant_1" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="798146588" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="250" name="__module.model/aten::arange/Range" type="Range" version="opset4"> + <data output_type="f32" /> + <input> + <port id="0" precision="I32" /> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="251" name="__module.model/aten::arange/ConvertLike" type="Convert" version="opset1"> + <data destination_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="I64" names="463"> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="252" name="__module.model/aten::gt/Convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="I64"> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="253" name="Constant_297562" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="254" name="Constant_297563" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="255" name="Gather_297564" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64" names="450" /> + </output> + </layer> + <layer id="256" name="__module.model/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="454" /> + </output> + </layer> + <layer id="257" name="__module.model/aten::arange/Constant_2" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="798146588" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="258" name="__module.model/aten::arange/Range_1" type="Range" version="opset4"> + <data output_type="f32" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="FP32" names="456,cache_position"> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="259" name="Constant_260" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="798146592" size="16" /> + <output> + <port id="0" precision="I64" names="464"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="260" name="__module.model/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="465"> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="261" name="__module.model/aten::gt/Greater" type="Greater" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="BOOL" names="466"> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="262" name="__module.model/aten::mul_/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="BOOL"> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="263" name="__module.model/aten::mul_/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="462,causal_mask.1"> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="264" name="336" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" names="336" /> + </output> + </layer> + <layer id="265" name="__module.model/aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="468"> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="266" name="__module.model/aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="469,470,471"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="267" name="Constant_267859" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="268" name="Constant_267861" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="269" name="Constant_267863" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="270" name="__module.model/prim::ListConstruct/Concat_1" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="473"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="271" name="__module.model/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="474,477,478,479,487,488,489,492_1,493_1,494_1,causal_mask.5"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="272" name="Constant_220554" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="273" name="SliceAssign_404/Reshape_3" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="274" name="Constant_139074" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="275" name="SliceAssign_404/ShapeOf" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="276" name="SliceAssign_404/ReduceProd" type="ReduceProd" version="opset1"> + <data keep_dims="false" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="277" name="Constant_139075" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="278" name="SliceAssign_404/Range" type="Range" version="opset4"> + <data output_type="i64" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="279" name="SliceAssign_404/Reshape" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64"> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="280" name="__module.model/aten::slice/Reshape_20" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="281" name="__module.model/aten::slice/Reshape_22" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="282" name="__module.model/aten::slice/Reshape_23" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="283" name="SliceAssign_404/Slice_2" type="Slice" version="opset8"> + <input> + <port id="0" precision="I64"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="I64"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="284" name="Constant_139077" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="798146592" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="285" name="SliceAssign_404/Reshape_4" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="286" name="__module.model/aten::slice/Reshape_36" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="287" name="__module.model/aten::slice/Reshape_38" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="288" name="__module.model/aten::slice/Reshape_39" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="289" name="__module.model/aten::slice/Slice_5" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="480,490,495_1"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="290" name="__module.model/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="I64"> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="482"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="291" name="__module.model/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="I64"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" names="483,484"> + <dim>-1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="292" name="__module.model/aten::add/Convert" type="Convert" version="opset1"> + <data destination_type="f32" /> + <input> + <port id="0" precision="I64"> + <dim>-1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="293" name="__module.model/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="485,padding_mask.1"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="294" name="Constant_290053" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="0" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="295" name="__module.model/aten::eq/Equal" type="Equal" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="BOOL" names="486,padding_mask"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="296" name="__module.model/aten::masked_fill/ConvertLike" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="798146568" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="297" name="__module.model/aten::masked_fill/Select" type="Select" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="BOOL"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="FP32" /> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="3" precision="FP32" names="491"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="298" name="__module.model/aten::copy_/ShapeOf" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="299" name="__module.model/aten::copy_/Broadcast" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="495"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="300" name="Constant_220555" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="301" name="SliceAssign_404/Reshape_5" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="302" name="SliceAssign_404/ScatterNDUpdate" type="ScatterNDUpdate" version="opset4"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + </port> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="303" name="SliceAssign_404/Reshape_6" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1110,1111,1112,1267,1268,1269,1424,1425,1426,1581,1582,1583,1738,1739,1740,1895,1896,1897,2052,2053,2054,2209,2210,2211,2366,2367,2368,2523,2524,2525,2680,2681,2682,2837,2838,2839,2994,2995,2996,3151,3152,3153,3308,3309,3310,3465,3466,3467,3622,3623,3624,3779,3780,3781,3936,3937,3938,4093,4094,4095,4250,4251,4252,4407,4408,4409,4564,4565,4566,4721,4722,4723,475,4878,4879,4880,5035,5036,5037,5192,5193,5194,5349,5350,5351,5506,5507,5508,5663,5664,5665,5820,5821,5822,5977,5978,5979,6134,6135,6136,6291,6292,6293,639,640,641,6448,6449,6450,6605,6606,6607,6762,6763,6764,6919,6920,6921,7076,7077,7078,7233,7234,7235,7390,7391,7392,7547,7548,7549,7704,7705,7706,7861,7862,7863,796,797,798,8018,8019,8020,953,954,955"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="304" name="__module.model.layers.0.self_attn/aten::slice/Reshape_60" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="305" name="Constant_297582" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="306" name="Reshape_297583" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="307" name="ShapeOf_297584" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="308" name="Constant_297585" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="309" name="Constant_297586" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="310" name="Gather_297587" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="311" name="Add_297588" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="638"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="312" name="__module.model.layers.0.self_attn/aten::slice/Reshape_62" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="313" name="__module.model.layers.0.self_attn/aten::slice/Reshape_63" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="314" name="__module.model.layers.0.self_attn/aten::slice/Slice_15" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="642"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="315" name="__module.model.layers.0.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="643,attn_output.1"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="316" name="__module.model.layers.0.self_attn/aten::transpose/ScatterElementsUpdate_3" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="317" name="__module.model.layers.0.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="644"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="318" name="Constant_301702" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="798146608" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="319" name="__module.model.layers.0.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="647"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="320" name="self.model.layers.0.self_attn.o_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="798146632" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="321" name="Convert_386037" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="322" name="self.model.layers.0.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="811253832" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="323" name="Convert_386039" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="324" name="self.model.layers.0.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="325" name="self.model.layers.0.self_attn.o_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="811356232" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="326" name="self.model.layers.0.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="327" name="Constant_386044" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="328" name="Reshape_386045" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="329" name="__module.model.layers.0.self_attn.o_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="330" name="__module.model.layers.0.self_attn.o_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="649,651,hidden_states.17"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="331" name="__module.model.layers.0/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="654,656,667,hidden_states.19,hidden_states.21"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="332" name="Constant_290057" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="811765832" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="333" name="Constant_290056" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="334" name="Constant_290054" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="335" name="__module.model.layers.0.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="657"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="336" name="Constant_1124" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="658"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="337" name="__module.model.layers.0.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="659,variance.3"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="338" name="Constant_290055" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="339" name="__module.model.layers.0.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="660"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="340" name="__module.model.layers.0.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="341" name="__module.model.layers.0.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="661"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="342" name="__module.model.layers.0.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="662,663,hidden_states.23,hidden_states.25"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="343" name="__module.model.layers.0.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="664,666"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="344" name="self.model.layers.0.mlp.gate_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="811786312" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="345" name="Convert_384597" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="346" name="self.model.layers.0.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="847175752" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="347" name="Convert_384599" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="348" name="self.model.layers.0.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="349" name="self.model.layers.0.mlp.gate_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="847452232" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="350" name="self.model.layers.0.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="351" name="Constant_384604" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="352" name="Reshape_384605" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="353" name="__module.model.layers.0.mlp.gate_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="354" name="__module.model.layers.0.mlp.gate_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="672,input.1"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="355" name="__module.model.layers.0.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="673"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="356" name="self.model.layers.0.mlp.up_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="848558168" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="357" name="Convert_384587" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="358" name="self.model.layers.0.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="883947608" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="359" name="Convert_384589" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="360" name="self.model.layers.0.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="361" name="self.model.layers.0.mlp.up_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="884224088" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="362" name="self.model.layers.0.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="363" name="Constant_384594" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="364" name="Reshape_384595" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="365" name="__module.model.layers.0.mlp.up_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="366" name="__module.model.layers.0.mlp.up_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="675"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="367" name="__module.model.layers.0.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="676"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="368" name="self.model.layers.0.mlp.down_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 128" offset="885330008" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="369" name="Convert_384607" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="370" name="self.model.layers.0.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 1" offset="920719448" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="371" name="Convert_384609" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="372" name="self.model.layers.0.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="373" name="self.model.layers.0.mlp.down_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 108, 1" offset="920995928" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="374" name="self.model.layers.0.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="375" name="Constant_384614" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="922101848" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="376" name="Reshape_384615" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="377" name="__module.model.layers.0.mlp.down_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="378" name="__module.model.layers.0.mlp.down_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="678,hidden_states.27"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="379" name="__module.model.layers.0/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="679,681,689,700,hidden_states.29,hidden_states.31"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="380" name="Constant_290061" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="922101864" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="381" name="Constant_290060" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="382" name="Constant_290058" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="383" name="__module.model.layers.1.input_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="690"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="384" name="Constant_1198" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="691"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="385" name="__module.model.layers.1.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="692,variance.5"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="386" name="Constant_290059" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="387" name="__module.model.layers.1.input_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="693"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="388" name="__module.model.layers.1.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="389" name="__module.model.layers.1.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="694"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="390" name="__module.model.layers.1.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="695,696,hidden_states.33,hidden_states.35"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="391" name="__module.model.layers.1.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="697,699,hidden_states.37"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="392" name="self.model.layers.1.self_attn.q_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="922122344" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="393" name="Convert_386047" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="394" name="self.model.layers.1.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="935229544" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="395" name="Convert_386049" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="396" name="self.model.layers.1.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="397" name="self.model.layers.1.self_attn.q_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="935331944" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="398" name="self.model.layers.1.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="399" name="Constant_386054" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="400" name="Reshape_386055" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="401" name="__module.model.layers.1.self_attn.q_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="402" name="__module.model.layers.1.self_attn.q_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="403" name="self.model.layers.1.self_attn.q_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="5120" offset="935741544" size="10240" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.1.self_attn.q_proj.bias"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="404" name="__module.model.layers.1.self_attn.q_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="405" name="__module.model.layers.1.self_attn.q_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="709,query_states.3"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="406" name="Constant_301703" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="792694336" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="407" name="__module.model.layers.1.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="717"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="408" name="__module.model.layers.1.self_attn/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="409" name="__module.model.layers.1.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="718,q.3"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="410" name="__module.model.layers.1.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="727"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="411" name="__module.model.layers.1.self_attn/aten::size/ShapeOf_3" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="412" name="__module.model.layers.1.self_attn/aten::size/Constant_3" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="413" name="__module.model.layers.1.self_attn/aten::size/Gather_3" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="728,733" /> + </output> + </layer> + <layer id="414" name="__module.model.layers.1.self_attn/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="415" name="__module.model.layers.1.self_attn/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="730,731,735,736" /> + </output> + </layer> + <layer id="416" name="Constant_220560" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="417" name="__module.model.layers.1.self_attn/aten::slice/Reshape_5" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="418" name="__module.model.layers.1.self_attn/aten::slice/Reshape_1" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="419" name="__module.model.layers.1.self_attn/aten::slice/Reshape_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="420" name="__module.model.layers.1.self_attn/aten::slice/Reshape_3" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="421" name="__module.model.layers.1.self_attn/aten::slice/Slice" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="737,x2.5"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="422" name="Constant_290062" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="423" name="__module.model.layers.1.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="738"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="424" name="__module.model.layers.1.self_attn/aten::slice/Reshape_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="425" name="__module.model.layers.1.self_attn/aten::slice/Reshape_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="426" name="__module.model.layers.1.self_attn/aten::slice/Reshape_7" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="427" name="__module.model.layers.1.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="732"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="428" name="__module.model.layers.1.self_attn/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="740"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="429" name="__module.model.layers.1.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="741"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="430" name="__module.model.layers.1.self_attn/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="742"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="431" name="Constant_340801" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="432" name="Constant_340794" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="433" name="Constant_340796" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="434" name="Constant_340798" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="435" name="Concat_340799" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="436" name="Broadcast_340802" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="437" name="ReadValue_333080" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.1.keypresent.1.key" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.1.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="438" name="Constant_325315" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="439" name="Gather_325316" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="440" name="self.model.layers.1.self_attn.k_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="935751784" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="441" name="Convert_387007" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="442" name="self.model.layers.1.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="938373224" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="443" name="Convert_387009" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="444" name="self.model.layers.1.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="445" name="self.model.layers.1.self_attn.k_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="938393704" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="446" name="self.model.layers.1.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="447" name="Constant_387014" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="448" name="Reshape_387015" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="449" name="__module.model.layers.1.self_attn.k_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="450" name="__module.model.layers.1.self_attn.k_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="451" name="self.model.layers.1.self_attn.k_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="938475624" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.1.self_attn.k_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="452" name="__module.model.layers.1.self_attn.k_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="453" name="__module.model.layers.1.self_attn.k_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="712,key_states.9"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="454" name="Constant_301704" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="455" name="__module.model.layers.1.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="720"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="456" name="__module.model.layers.1.self_attn/aten::transpose/ScatterElementsUpdate_1" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="457" name="__module.model.layers.1.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="721,k.3"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="458" name="__module.model.layers.1.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="743"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="459" name="__module.model.layers.1.self_attn/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="460" name="__module.model.layers.1.self_attn/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="461" name="__module.model.layers.1.self_attn/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="744,749" /> + </output> + </layer> + <layer id="462" name="__module.model.layers.1.self_attn/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="463" name="__module.model.layers.1.self_attn/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="746,747,751,752" /> + </output> + </layer> + <layer id="464" name="Constant_220561" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="465" name="__module.model.layers.1.self_attn/aten::slice/Reshape_13" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="466" name="__module.model.layers.1.self_attn/aten::slice/Reshape_9" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="467" name="__module.model.layers.1.self_attn/aten::slice/Reshape_10" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="468" name="__module.model.layers.1.self_attn/aten::slice/Reshape_11" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="469" name="__module.model.layers.1.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="753,x2.7"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="470" name="Constant_290063" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="471" name="__module.model.layers.1.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="754"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="472" name="__module.model.layers.1.self_attn/aten::slice/Reshape_12" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="473" name="__module.model.layers.1.self_attn/aten::slice/Reshape_14" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="474" name="__module.model.layers.1.self_attn/aten::slice/Reshape_15" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="475" name="__module.model.layers.1.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="748"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="476" name="__module.model.layers.1.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="756"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="477" name="__module.model.layers.1.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="757"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="478" name="__module.model.layers.1.self_attn/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="758"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="479" name="__module.model.layers.1.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.1.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="480" name="__module.model.layers.1.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="770,771,772"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="481" name="__module.model.layers.1.self_attn/aten::size/ShapeOf_6" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="482" name="Constant_302369" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="938477672" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="483" name="Constant_302370" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="484" name="Gather_302371" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="485" name="Constant_267870" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="486" name="Constant_276226" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="487" name="Constant_276227" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="488" name="Gather_276228" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="489" name="__module.model.layers.1.self_attn/prim::ListConstruct/Concat_2" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="3" precision="I64" names="773"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="490" name="__module.model.layers.1.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="774,hidden_states.41"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="491" name="Constant_301705" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="492" name="__module.model.layers.1.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="778,key_states.11"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="493" name="Constant_340814" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="494" name="Constant_340807" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="495" name="Constant_340809" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="496" name="Constant_340811" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="497" name="Concat_340812" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="498" name="Broadcast_340815" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="499" name="ReadValue_333082" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.1.valuepresent.1.value" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.1.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="500" name="Constant_325318" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="501" name="Gather_325319" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="502" name="self.model.layers.1.self_attn.v_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="938477688" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="503" name="Convert_387017" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="504" name="self.model.layers.1.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="941099128" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="505" name="Convert_387019" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="506" name="self.model.layers.1.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="507" name="self.model.layers.1.self_attn.v_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="941119608" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="508" name="self.model.layers.1.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="509" name="Constant_387024" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="510" name="Reshape_387025" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="511" name="__module.model.layers.1.self_attn.v_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="512" name="__module.model.layers.1.self_attn.v_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="513" name="self.model.layers.1.self_attn.v_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="941201528" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.1.self_attn.v_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="514" name="__module.model.layers.1.self_attn.v_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="515" name="__module.model.layers.1.self_attn.v_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="715,value_states.3"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="516" name="Constant_301706" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="517" name="__module.model.layers.1.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="723"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="518" name="__module.model.layers.1.self_attn/aten::transpose/ScatterElementsUpdate_2" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="519" name="__module.model.layers.1.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="724"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="520" name="__module.model.layers.1.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.1.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="521" name="__module.model.layers.1.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="786,787,788"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="522" name="__module.model.layers.1.self_attn/aten::size/ShapeOf_10" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="523" name="Constant_302091" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="524" name="__module.model.layers.1.self_attn/aten::size/Constant_11" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="525" name="__module.model.layers.1.self_attn/aten::size/Gather_11" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="780"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="526" name="Constant_267888" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="527" name="Constant_276236" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="528" name="Constant_276237" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="529" name="Gather_276238" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="530" name="__module.model.layers.1.self_attn/prim::ListConstruct/Concat_5" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="789"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="531" name="__module.model.layers.1.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="790,hidden_states.45"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="532" name="Constant_301707" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="533" name="__module.model.layers.1.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="794"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="534" name="__module.model.layers.1.self_attn/aten::slice/Reshape_60" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="535" name="ShapeOf_297666" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="536" name="Constant_297667" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="537" name="Constant_297668" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="538" name="Gather_297669" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="539" name="ShapeOf_297670" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="540" name="Constant_297671" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="541" name="Constant_297672" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="542" name="Gather_297673" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="543" name="Add_297674" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="795"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="544" name="__module.model.layers.1.self_attn/aten::slice/Reshape_62" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="545" name="__module.model.layers.1.self_attn/aten::slice/Reshape_63" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="546" name="__module.model.layers.1.self_attn/aten::slice/Slice_15" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="799"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="547" name="__module.model.layers.1.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="800,attn_output.5"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="548" name="__module.model.layers.1.self_attn/aten::transpose/ScatterElementsUpdate_3" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="549" name="__module.model.layers.1.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="801"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="550" name="Constant_301708" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="798146608" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="551" name="__module.model.layers.1.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="804"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="552" name="self.model.layers.1.self_attn.o_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="941203576" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="553" name="Convert_386057" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="554" name="self.model.layers.1.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="954310776" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="555" name="Convert_386059" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="556" name="self.model.layers.1.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="557" name="self.model.layers.1.self_attn.o_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="954413176" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="558" name="self.model.layers.1.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="559" name="Constant_386064" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="560" name="Reshape_386065" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="561" name="__module.model.layers.1.self_attn.o_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="562" name="__module.model.layers.1.self_attn.o_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="806,808,hidden_states.47"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="563" name="__module.model.layers.1/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="811,813,824,hidden_states.49,hidden_states.51"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="564" name="Constant_290067" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="954822776" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="565" name="Constant_290066" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="566" name="Constant_290064" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="567" name="__module.model.layers.1.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="814"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="568" name="Constant_1796" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="815"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="569" name="__module.model.layers.1.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="816,variance.7"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="570" name="Constant_290065" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="571" name="__module.model.layers.1.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="817"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="572" name="__module.model.layers.1.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="573" name="__module.model.layers.1.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="818"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="574" name="__module.model.layers.1.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="819,820,hidden_states.53,hidden_states.55"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="575" name="__module.model.layers.1.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="821,823"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="576" name="self.model.layers.1.mlp.gate_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="954843256" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="577" name="Convert_384627" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="578" name="self.model.layers.1.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="990232696" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="579" name="Convert_384629" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="580" name="self.model.layers.1.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="581" name="self.model.layers.1.mlp.gate_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="990509176" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="582" name="self.model.layers.1.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="583" name="Constant_384634" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="584" name="Reshape_384635" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="585" name="__module.model.layers.1.mlp.gate_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="586" name="__module.model.layers.1.mlp.gate_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="829,input.3"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="587" name="__module.model.layers.1.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="830"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="588" name="self.model.layers.1.mlp.up_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="991615096" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="589" name="Convert_384617" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="590" name="self.model.layers.1.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="1027004536" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="591" name="Convert_384619" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="592" name="self.model.layers.1.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="593" name="self.model.layers.1.mlp.up_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="1027281016" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="594" name="self.model.layers.1.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="595" name="Constant_384624" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="596" name="Reshape_384625" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="597" name="__module.model.layers.1.mlp.up_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="598" name="__module.model.layers.1.mlp.up_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="832"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="599" name="__module.model.layers.1.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="833"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="600" name="self.model.layers.1.mlp.down_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 128" offset="1028386936" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="601" name="Convert_384637" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="602" name="self.model.layers.1.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 1" offset="1063776376" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="603" name="Convert_384639" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="604" name="self.model.layers.1.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="605" name="self.model.layers.1.mlp.down_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 108, 1" offset="1064052856" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="606" name="self.model.layers.1.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="607" name="Constant_384644" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="922101848" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="608" name="Reshape_384645" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="609" name="__module.model.layers.1.mlp.down_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="610" name="__module.model.layers.1.mlp.down_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="835,hidden_states.57"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="611" name="__module.model.layers.1/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="836,838,846,857,hidden_states.59,hidden_states.61"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="612" name="Constant_290071" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="1065158776" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="613" name="Constant_290070" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="614" name="Constant_290068" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="615" name="__module.model.layers.2.input_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="847"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="616" name="Constant_1870" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="848"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="617" name="__module.model.layers.2.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="849,variance.9"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="618" name="Constant_290069" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="619" name="__module.model.layers.2.input_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="850"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="620" name="__module.model.layers.2.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="621" name="__module.model.layers.2.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="851"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="622" name="__module.model.layers.2.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="852,853,hidden_states.63,hidden_states.65"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="623" name="__module.model.layers.2.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="854,856,hidden_states.67"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="624" name="self.model.layers.2.self_attn.q_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="1065179256" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="625" name="Convert_386067" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="626" name="self.model.layers.2.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="1078286456" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="627" name="Convert_386069" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="628" name="self.model.layers.2.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="629" name="self.model.layers.2.self_attn.q_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="1078388856" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="630" name="self.model.layers.2.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="631" name="Constant_386074" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="632" name="Reshape_386075" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="633" name="__module.model.layers.2.self_attn.q_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="634" name="__module.model.layers.2.self_attn.q_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="635" name="self.model.layers.2.self_attn.q_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="5120" offset="1078798456" size="10240" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.2.self_attn.q_proj.bias"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="636" name="__module.model.layers.2.self_attn.q_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="637" name="__module.model.layers.2.self_attn.q_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="866,query_states.5"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="638" name="Constant_301709" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="792694336" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="639" name="__module.model.layers.2.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="874"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="640" name="__module.model.layers.2.self_attn/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="641" name="__module.model.layers.2.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="875,q.5"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="642" name="__module.model.layers.2.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="884"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="643" name="__module.model.layers.2.self_attn/aten::size/ShapeOf_3" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="644" name="__module.model.layers.2.self_attn/aten::size/Constant_3" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="645" name="__module.model.layers.2.self_attn/aten::size/Gather_3" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="885,890" /> + </output> + </layer> + <layer id="646" name="__module.model.layers.2.self_attn/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="647" name="__module.model.layers.2.self_attn/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="887,888,892,893" /> + </output> + </layer> + <layer id="648" name="Constant_220575" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="649" name="__module.model.layers.2.self_attn/aten::slice/Reshape_5" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="650" name="__module.model.layers.2.self_attn/aten::slice/Reshape_1" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="651" name="__module.model.layers.2.self_attn/aten::slice/Reshape_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="652" name="__module.model.layers.2.self_attn/aten::slice/Reshape_3" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="653" name="__module.model.layers.2.self_attn/aten::slice/Slice" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="894,x2.9"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="654" name="Constant_290072" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="655" name="__module.model.layers.2.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="895"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="656" name="__module.model.layers.2.self_attn/aten::slice/Reshape_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="657" name="__module.model.layers.2.self_attn/aten::slice/Reshape_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="658" name="__module.model.layers.2.self_attn/aten::slice/Reshape_7" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="659" name="__module.model.layers.2.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="889"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="660" name="__module.model.layers.2.self_attn/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="897"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="661" name="__module.model.layers.2.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="898"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="662" name="__module.model.layers.2.self_attn/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="899"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="663" name="Constant_340827" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="664" name="Constant_340820" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="665" name="Constant_340822" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="666" name="Constant_340824" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="667" name="Concat_340825" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="668" name="Broadcast_340828" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="669" name="ReadValue_333124" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.2.keypresent.2.key" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.2.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="670" name="Constant_325321" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="671" name="Gather_325322" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="672" name="self.model.layers.2.self_attn.k_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="1078808696" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="673" name="Convert_387027" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="674" name="self.model.layers.2.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="1081430136" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="675" name="Convert_387029" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="676" name="self.model.layers.2.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="677" name="self.model.layers.2.self_attn.k_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="1081450616" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="678" name="self.model.layers.2.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="679" name="Constant_387034" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="680" name="Reshape_387035" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="681" name="__module.model.layers.2.self_attn.k_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="682" name="__module.model.layers.2.self_attn.k_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="683" name="self.model.layers.2.self_attn.k_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="1081532536" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.2.self_attn.k_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="684" name="__module.model.layers.2.self_attn.k_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="685" name="__module.model.layers.2.self_attn.k_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="869,key_states.13"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="686" name="Constant_301710" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="687" name="__module.model.layers.2.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="877"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="688" name="__module.model.layers.2.self_attn/aten::transpose/ScatterElementsUpdate_1" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="689" name="__module.model.layers.2.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="878,k.5"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="690" name="__module.model.layers.2.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="900"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="691" name="__module.model.layers.2.self_attn/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="692" name="__module.model.layers.2.self_attn/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="693" name="__module.model.layers.2.self_attn/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="901,906" /> + </output> + </layer> + <layer id="694" name="__module.model.layers.2.self_attn/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="695" name="__module.model.layers.2.self_attn/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="903,904,908,909" /> + </output> + </layer> + <layer id="696" name="Constant_220576" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="697" name="__module.model.layers.2.self_attn/aten::slice/Reshape_13" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="698" name="__module.model.layers.2.self_attn/aten::slice/Reshape_9" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="699" name="__module.model.layers.2.self_attn/aten::slice/Reshape_10" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="700" name="__module.model.layers.2.self_attn/aten::slice/Reshape_11" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="701" name="__module.model.layers.2.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="910,x2.11"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="702" name="Constant_290073" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="703" name="__module.model.layers.2.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="911"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="704" name="__module.model.layers.2.self_attn/aten::slice/Reshape_12" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="705" name="__module.model.layers.2.self_attn/aten::slice/Reshape_14" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="706" name="__module.model.layers.2.self_attn/aten::slice/Reshape_15" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="707" name="__module.model.layers.2.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="905"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="708" name="__module.model.layers.2.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="913"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="709" name="__module.model.layers.2.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="914"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="710" name="__module.model.layers.2.self_attn/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="915"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="711" name="__module.model.layers.2.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.2.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="712" name="__module.model.layers.2.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="927,928,929"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="713" name="__module.model.layers.2.self_attn/aten::size/ShapeOf_6" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="714" name="Constant_302374" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="938477672" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="715" name="Constant_302375" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="716" name="Gather_302376" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="717" name="Constant_267906" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="718" name="Constant_276261" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="719" name="Constant_276262" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="720" name="Gather_276263" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="721" name="__module.model.layers.2.self_attn/prim::ListConstruct/Concat_2" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="3" precision="I64" names="930"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="722" name="__module.model.layers.2.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="931,hidden_states.71"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="723" name="Constant_301711" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="724" name="__module.model.layers.2.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="935,key_states.15"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="725" name="Constant_340840" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="726" name="Constant_340833" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="727" name="Constant_340835" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="728" name="Constant_340837" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="729" name="Concat_340838" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="730" name="Broadcast_340841" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="731" name="ReadValue_333126" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.2.valuepresent.2.value" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.2.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="732" name="Constant_325324" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="733" name="Gather_325325" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="734" name="self.model.layers.2.self_attn.v_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="1081534584" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="735" name="Convert_387037" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="736" name="self.model.layers.2.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="1084156024" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="737" name="Convert_387039" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="738" name="self.model.layers.2.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="739" name="self.model.layers.2.self_attn.v_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="1084176504" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="740" name="self.model.layers.2.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="741" name="Constant_387044" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="742" name="Reshape_387045" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="743" name="__module.model.layers.2.self_attn.v_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="744" name="__module.model.layers.2.self_attn.v_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="745" name="self.model.layers.2.self_attn.v_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="1084258424" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.2.self_attn.v_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="746" name="__module.model.layers.2.self_attn.v_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="747" name="__module.model.layers.2.self_attn.v_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="872,value_states.5"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="748" name="Constant_301712" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="749" name="__module.model.layers.2.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="880"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="750" name="__module.model.layers.2.self_attn/aten::transpose/ScatterElementsUpdate_2" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="751" name="__module.model.layers.2.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="881"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="752" name="__module.model.layers.2.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.2.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="753" name="__module.model.layers.2.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="943,944,945"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="754" name="__module.model.layers.2.self_attn/aten::size/ShapeOf_10" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="755" name="Constant_302097" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="756" name="__module.model.layers.2.self_attn/aten::size/Constant_11" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="757" name="__module.model.layers.2.self_attn/aten::size/Gather_11" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="937"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="758" name="Constant_267924" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="759" name="Constant_276271" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="760" name="Constant_276272" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="761" name="Gather_276273" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="762" name="__module.model.layers.2.self_attn/prim::ListConstruct/Concat_5" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="946"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="763" name="__module.model.layers.2.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="947,hidden_states.75"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="764" name="Constant_301713" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="765" name="__module.model.layers.2.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="951"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="766" name="__module.model.layers.2.self_attn/aten::slice/Reshape_60" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="767" name="ShapeOf_297752" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="768" name="Constant_297753" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="769" name="Constant_297754" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="770" name="Gather_297755" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="771" name="ShapeOf_297756" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="772" name="Constant_297757" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="773" name="Constant_297758" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="774" name="Gather_297759" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="775" name="Add_297760" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="952"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="776" name="__module.model.layers.2.self_attn/aten::slice/Reshape_62" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="777" name="__module.model.layers.2.self_attn/aten::slice/Reshape_63" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="778" name="__module.model.layers.2.self_attn/aten::slice/Slice_15" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="956"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="779" name="__module.model.layers.2.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="957,attn_output.9"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="780" name="__module.model.layers.2.self_attn/aten::transpose/ScatterElementsUpdate_3" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="781" name="__module.model.layers.2.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="958"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="782" name="Constant_301714" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="798146608" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="783" name="__module.model.layers.2.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="961"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="784" name="self.model.layers.2.self_attn.o_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="1084260472" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="785" name="Convert_386077" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="786" name="self.model.layers.2.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="1097367672" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="787" name="Convert_386079" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="788" name="self.model.layers.2.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="789" name="self.model.layers.2.self_attn.o_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="1097470072" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="790" name="self.model.layers.2.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="791" name="Constant_386084" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="792" name="Reshape_386085" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="793" name="__module.model.layers.2.self_attn.o_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="794" name="__module.model.layers.2.self_attn.o_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="963,965,hidden_states.77"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="795" name="__module.model.layers.2/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="968,970,981,hidden_states.79,hidden_states.81"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="796" name="Constant_290077" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="1097879672" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="797" name="Constant_290076" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="798" name="Constant_290074" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="799" name="__module.model.layers.2.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="971"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="800" name="Constant_2468" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="972"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="801" name="__module.model.layers.2.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="973,variance.11"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="802" name="Constant_290075" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="803" name="__module.model.layers.2.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="974"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="804" name="__module.model.layers.2.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="805" name="__module.model.layers.2.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="975"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="806" name="__module.model.layers.2.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="976,977,hidden_states.83,hidden_states.85"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="807" name="__module.model.layers.2.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="978,980"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="808" name="self.model.layers.2.mlp.gate_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="1097900152" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="809" name="Convert_384657" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="810" name="self.model.layers.2.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="1133289592" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="811" name="Convert_384659" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="812" name="self.model.layers.2.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="813" name="self.model.layers.2.mlp.gate_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="1133566072" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="814" name="self.model.layers.2.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="815" name="Constant_384664" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="816" name="Reshape_384665" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="817" name="__module.model.layers.2.mlp.gate_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="818" name="__module.model.layers.2.mlp.gate_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="986,input.5"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="819" name="__module.model.layers.2.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="987"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="820" name="self.model.layers.2.mlp.up_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="1134671992" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="821" name="Convert_384647" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="822" name="self.model.layers.2.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="1170061432" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="823" name="Convert_384649" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="824" name="self.model.layers.2.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="825" name="self.model.layers.2.mlp.up_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="1170337912" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="826" name="self.model.layers.2.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="827" name="Constant_384654" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="828" name="Reshape_384655" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="829" name="__module.model.layers.2.mlp.up_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="830" name="__module.model.layers.2.mlp.up_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="989"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="831" name="__module.model.layers.2.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="990"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="832" name="self.model.layers.2.mlp.down_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 128" offset="1171443832" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="833" name="Convert_384667" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="834" name="self.model.layers.2.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 1" offset="1206833272" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="835" name="Convert_384669" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="836" name="self.model.layers.2.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="837" name="self.model.layers.2.mlp.down_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 108, 1" offset="1207109752" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="838" name="self.model.layers.2.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="839" name="Constant_384674" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="922101848" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="840" name="Reshape_384675" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="841" name="__module.model.layers.2.mlp.down_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="842" name="__module.model.layers.2.mlp.down_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="992,hidden_states.87"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="843" name="__module.model.layers.2/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1003,1014,993,995,hidden_states.89,hidden_states.91"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="844" name="Constant_290081" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="1208215672" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="845" name="Constant_290080" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="846" name="Constant_290078" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="847" name="__module.model.layers.3.input_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1004"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="848" name="Constant_2542" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="1005"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="849" name="__module.model.layers.3.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1006,variance.13"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="850" name="Constant_290079" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="851" name="__module.model.layers.3.input_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1007"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="852" name="__module.model.layers.3.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="853" name="__module.model.layers.3.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1008"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="854" name="__module.model.layers.3.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1009,1010,hidden_states.93,hidden_states.95"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="855" name="__module.model.layers.3.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1011,1013,hidden_states.97"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="856" name="self.model.layers.3.self_attn.q_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="1208236152" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="857" name="Convert_386087" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="858" name="self.model.layers.3.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="1221343352" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="859" name="Convert_386089" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="860" name="self.model.layers.3.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="861" name="self.model.layers.3.self_attn.q_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="1221445752" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="862" name="self.model.layers.3.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="863" name="Constant_386094" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="864" name="Reshape_386095" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="865" name="__module.model.layers.3.self_attn.q_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="866" name="__module.model.layers.3.self_attn.q_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="867" name="self.model.layers.3.self_attn.q_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="5120" offset="1221855352" size="10240" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.3.self_attn.q_proj.bias"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="868" name="__module.model.layers.3.self_attn.q_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="869" name="__module.model.layers.3.self_attn.q_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1023,query_states.7"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="870" name="Constant_301715" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="792694336" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="871" name="__module.model.layers.3.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1031"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="872" name="__module.model.layers.3.self_attn/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="873" name="__module.model.layers.3.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1032,q.7"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="874" name="__module.model.layers.3.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1041"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="875" name="__module.model.layers.3.self_attn/aten::size/ShapeOf_3" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="876" name="__module.model.layers.3.self_attn/aten::size/Constant_3" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="877" name="__module.model.layers.3.self_attn/aten::size/Gather_3" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="1042,1047" /> + </output> + </layer> + <layer id="878" name="__module.model.layers.3.self_attn/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="879" name="__module.model.layers.3.self_attn/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="1044,1045,1049,1050" /> + </output> + </layer> + <layer id="880" name="Constant_220590" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="881" name="__module.model.layers.3.self_attn/aten::slice/Reshape_5" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="882" name="__module.model.layers.3.self_attn/aten::slice/Reshape_1" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="883" name="__module.model.layers.3.self_attn/aten::slice/Reshape_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="884" name="__module.model.layers.3.self_attn/aten::slice/Reshape_3" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="885" name="__module.model.layers.3.self_attn/aten::slice/Slice" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="1051,x2.13"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="886" name="Constant_290082" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="887" name="__module.model.layers.3.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1052"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="888" name="__module.model.layers.3.self_attn/aten::slice/Reshape_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="889" name="__module.model.layers.3.self_attn/aten::slice/Reshape_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="890" name="__module.model.layers.3.self_attn/aten::slice/Reshape_7" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="891" name="__module.model.layers.3.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="1046"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="892" name="__module.model.layers.3.self_attn/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1054"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="893" name="__module.model.layers.3.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1055"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="894" name="__module.model.layers.3.self_attn/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1056"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="895" name="Constant_340853" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="896" name="Constant_340846" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="897" name="Constant_340848" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="898" name="Constant_340850" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="899" name="Concat_340851" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="900" name="Broadcast_340854" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="901" name="ReadValue_333168" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.3.keypresent.3.key" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.3.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="902" name="Constant_325327" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="903" name="Gather_325328" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="904" name="self.model.layers.3.self_attn.k_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="1221865592" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="905" name="Convert_387047" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="906" name="self.model.layers.3.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="1224487032" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="907" name="Convert_387049" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="908" name="self.model.layers.3.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="909" name="self.model.layers.3.self_attn.k_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="1224507512" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="910" name="self.model.layers.3.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="911" name="Constant_387054" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="912" name="Reshape_387055" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="913" name="__module.model.layers.3.self_attn.k_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="914" name="__module.model.layers.3.self_attn.k_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="915" name="self.model.layers.3.self_attn.k_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="1224589432" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.3.self_attn.k_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="916" name="__module.model.layers.3.self_attn.k_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="917" name="__module.model.layers.3.self_attn.k_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1026,key_states.17"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="918" name="Constant_301716" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="919" name="__module.model.layers.3.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1034"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="920" name="__module.model.layers.3.self_attn/aten::transpose/ScatterElementsUpdate_1" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="921" name="__module.model.layers.3.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1035,k.7"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="922" name="__module.model.layers.3.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1057"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="923" name="__module.model.layers.3.self_attn/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="924" name="__module.model.layers.3.self_attn/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="925" name="__module.model.layers.3.self_attn/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="1058,1063" /> + </output> + </layer> + <layer id="926" name="__module.model.layers.3.self_attn/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="927" name="__module.model.layers.3.self_attn/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="1060,1061,1065,1066" /> + </output> + </layer> + <layer id="928" name="Constant_220591" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="929" name="__module.model.layers.3.self_attn/aten::slice/Reshape_13" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="930" name="__module.model.layers.3.self_attn/aten::slice/Reshape_9" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="931" name="__module.model.layers.3.self_attn/aten::slice/Reshape_10" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="932" name="__module.model.layers.3.self_attn/aten::slice/Reshape_11" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="933" name="__module.model.layers.3.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="1067,x2.15"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="934" name="Constant_290083" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="935" name="__module.model.layers.3.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1068"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="936" name="__module.model.layers.3.self_attn/aten::slice/Reshape_12" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="937" name="__module.model.layers.3.self_attn/aten::slice/Reshape_14" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="938" name="__module.model.layers.3.self_attn/aten::slice/Reshape_15" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="939" name="__module.model.layers.3.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="1062"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="940" name="__module.model.layers.3.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1070"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="941" name="__module.model.layers.3.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1071"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="942" name="__module.model.layers.3.self_attn/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1072"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="943" name="__module.model.layers.3.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.3.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="944" name="__module.model.layers.3.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="1084,1085,1086"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="945" name="__module.model.layers.3.self_attn/aten::size/ShapeOf_6" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="946" name="Constant_302379" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="938477672" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="947" name="Constant_302380" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="948" name="Gather_302381" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="949" name="Constant_267942" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="950" name="Constant_276296" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="951" name="Constant_276297" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="952" name="Gather_276298" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="953" name="__module.model.layers.3.self_attn/prim::ListConstruct/Concat_2" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="3" precision="I64" names="1087"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="954" name="__module.model.layers.3.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1088,hidden_states.101"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="955" name="Constant_301717" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="956" name="__module.model.layers.3.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1092,key_states.19"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="957" name="Constant_340866" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="958" name="Constant_340859" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="959" name="Constant_340861" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="960" name="Constant_340863" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="961" name="Concat_340864" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="962" name="Broadcast_340867" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="963" name="ReadValue_333170" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.3.valuepresent.3.value" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.3.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="964" name="Constant_325330" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="965" name="Gather_325331" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="966" name="self.model.layers.3.self_attn.v_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="1224591480" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="967" name="Convert_387057" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="968" name="self.model.layers.3.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="1227212920" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="969" name="Convert_387059" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="970" name="self.model.layers.3.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="971" name="self.model.layers.3.self_attn.v_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="1227233400" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="972" name="self.model.layers.3.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="973" name="Constant_387064" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="974" name="Reshape_387065" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="975" name="__module.model.layers.3.self_attn.v_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="976" name="__module.model.layers.3.self_attn.v_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="977" name="self.model.layers.3.self_attn.v_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="1227315320" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.3.self_attn.v_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="978" name="__module.model.layers.3.self_attn.v_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="979" name="__module.model.layers.3.self_attn.v_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1029,value_states.7"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="980" name="Constant_301718" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="981" name="__module.model.layers.3.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1037"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="982" name="__module.model.layers.3.self_attn/aten::transpose/ScatterElementsUpdate_2" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="983" name="__module.model.layers.3.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1038"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="984" name="__module.model.layers.3.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.3.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="985" name="__module.model.layers.3.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="1100,1101,1102"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="986" name="__module.model.layers.3.self_attn/aten::size/ShapeOf_10" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="987" name="Constant_302103" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="988" name="__module.model.layers.3.self_attn/aten::size/Constant_11" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="989" name="__module.model.layers.3.self_attn/aten::size/Gather_11" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="1094"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="990" name="Constant_267960" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="991" name="Constant_276306" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="992" name="Constant_276307" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="993" name="Gather_276308" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="994" name="__module.model.layers.3.self_attn/prim::ListConstruct/Concat_5" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="1103"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="995" name="__module.model.layers.3.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1104,hidden_states.105"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="996" name="Constant_301719" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="997" name="__module.model.layers.3.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1108"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="998" name="__module.model.layers.3.self_attn/aten::slice/Reshape_60" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="999" name="ShapeOf_297838" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1000" name="Constant_297839" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1001" name="Constant_297840" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1002" name="Gather_297841" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1003" name="ShapeOf_297842" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1004" name="Constant_297843" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1005" name="Constant_297844" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1006" name="Gather_297845" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1007" name="Add_297846" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="1109"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1008" name="__module.model.layers.3.self_attn/aten::slice/Reshape_62" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1009" name="__module.model.layers.3.self_attn/aten::slice/Reshape_63" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1010" name="__module.model.layers.3.self_attn/aten::slice/Slice_15" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="1113"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="1011" name="__module.model.layers.3.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1114,attn_output.13"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1012" name="__module.model.layers.3.self_attn/aten::transpose/ScatterElementsUpdate_3" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1013" name="__module.model.layers.3.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1115"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1014" name="Constant_301720" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="798146608" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="1015" name="__module.model.layers.3.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1118"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1016" name="self.model.layers.3.self_attn.o_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="1227317368" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1017" name="Convert_386097" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1018" name="self.model.layers.3.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="1240424568" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1019" name="Convert_386099" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1020" name="self.model.layers.3.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1021" name="self.model.layers.3.self_attn.o_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="1240526968" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1022" name="self.model.layers.3.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1023" name="Constant_386104" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1024" name="Reshape_386105" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1025" name="__module.model.layers.3.self_attn.o_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1026" name="__module.model.layers.3.self_attn.o_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1120,1122,hidden_states.107"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1027" name="__module.model.layers.3/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1125,1127,1138,hidden_states.109,hidden_states.111"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1028" name="Constant_290087" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="1240936568" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1029" name="Constant_290086" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1030" name="Constant_290084" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1031" name="__module.model.layers.3.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1128"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1032" name="Constant_3140" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="1129"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1033" name="__module.model.layers.3.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1130,variance.15"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1034" name="Constant_290085" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1035" name="__module.model.layers.3.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1131"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1036" name="__module.model.layers.3.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1037" name="__module.model.layers.3.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1132"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1038" name="__module.model.layers.3.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1133,1134,hidden_states.113,hidden_states.115"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1039" name="__module.model.layers.3.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1135,1137"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1040" name="self.model.layers.3.mlp.gate_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="1240957048" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1041" name="Convert_384687" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1042" name="self.model.layers.3.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="1276346488" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1043" name="Convert_384689" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1044" name="self.model.layers.3.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1045" name="self.model.layers.3.mlp.gate_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="1276622968" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1046" name="self.model.layers.3.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1047" name="Constant_384694" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1048" name="Reshape_384695" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1049" name="__module.model.layers.3.mlp.gate_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1050" name="__module.model.layers.3.mlp.gate_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1143,input.7"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="1051" name="__module.model.layers.3.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="1144"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="1052" name="self.model.layers.3.mlp.up_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="1277728888" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1053" name="Convert_384677" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1054" name="self.model.layers.3.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="1313118328" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1055" name="Convert_384679" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1056" name="self.model.layers.3.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1057" name="self.model.layers.3.mlp.up_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="1313394808" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1058" name="self.model.layers.3.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1059" name="Constant_384684" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1060" name="Reshape_384685" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1061" name="__module.model.layers.3.mlp.up_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1062" name="__module.model.layers.3.mlp.up_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1146"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="1063" name="__module.model.layers.3.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1147"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="1064" name="self.model.layers.3.mlp.down_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 128" offset="1314500728" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1065" name="Convert_384697" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1066" name="self.model.layers.3.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 1" offset="1349890168" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1067" name="Convert_384699" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1068" name="self.model.layers.3.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1069" name="self.model.layers.3.mlp.down_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 108, 1" offset="1350166648" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1070" name="self.model.layers.3.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1071" name="Constant_384704" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="922101848" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1072" name="Reshape_384705" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="1073" name="__module.model.layers.3.mlp.down_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="1074" name="__module.model.layers.3.mlp.down_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1149,hidden_states.117"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1075" name="__module.model.layers.3/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1150,1152,1160,1171,hidden_states.119,hidden_states.121"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1076" name="Constant_290091" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="1351272568" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1077" name="Constant_290090" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1078" name="Constant_290088" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1079" name="__module.model.layers.4.input_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1161"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1080" name="Constant_3214" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="1162"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1081" name="__module.model.layers.4.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1163,variance.17"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1082" name="Constant_290089" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1083" name="__module.model.layers.4.input_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1164"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1084" name="__module.model.layers.4.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1085" name="__module.model.layers.4.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1165"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1086" name="__module.model.layers.4.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1166,1167,hidden_states.123,hidden_states.125"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1087" name="__module.model.layers.4.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1168,1170,hidden_states.127"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1088" name="self.model.layers.4.self_attn.q_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="1351293048" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1089" name="Convert_386107" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1090" name="self.model.layers.4.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="1364400248" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1091" name="Convert_386109" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1092" name="self.model.layers.4.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1093" name="self.model.layers.4.self_attn.q_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="1364502648" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1094" name="self.model.layers.4.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1095" name="Constant_386114" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1096" name="Reshape_386115" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1097" name="__module.model.layers.4.self_attn.q_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1098" name="__module.model.layers.4.self_attn.q_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1099" name="self.model.layers.4.self_attn.q_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="5120" offset="1364912248" size="10240" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.4.self_attn.q_proj.bias"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1100" name="__module.model.layers.4.self_attn.q_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1101" name="__module.model.layers.4.self_attn.q_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1180,query_states.9"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1102" name="Constant_301721" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="792694336" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1103" name="__module.model.layers.4.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1188"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1104" name="__module.model.layers.4.self_attn/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1105" name="__module.model.layers.4.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1189,q.9"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1106" name="__module.model.layers.4.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1198"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1107" name="__module.model.layers.4.self_attn/aten::size/ShapeOf_3" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1108" name="__module.model.layers.4.self_attn/aten::size/Constant_3" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="1109" name="__module.model.layers.4.self_attn/aten::size/Gather_3" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="1199,1204" /> + </output> + </layer> + <layer id="1110" name="__module.model.layers.4.self_attn/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="1111" name="__module.model.layers.4.self_attn/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="1201,1202,1206,1207" /> + </output> + </layer> + <layer id="1112" name="Constant_220605" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1113" name="__module.model.layers.4.self_attn/aten::slice/Reshape_5" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1114" name="__module.model.layers.4.self_attn/aten::slice/Reshape_1" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1115" name="__module.model.layers.4.self_attn/aten::slice/Reshape_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1116" name="__module.model.layers.4.self_attn/aten::slice/Reshape_3" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1117" name="__module.model.layers.4.self_attn/aten::slice/Slice" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="1208,x2.17"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1118" name="Constant_290092" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1119" name="__module.model.layers.4.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1209"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1120" name="__module.model.layers.4.self_attn/aten::slice/Reshape_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1121" name="__module.model.layers.4.self_attn/aten::slice/Reshape_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1122" name="__module.model.layers.4.self_attn/aten::slice/Reshape_7" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1123" name="__module.model.layers.4.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="1203"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1124" name="__module.model.layers.4.self_attn/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1211"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1125" name="__module.model.layers.4.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1212"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1126" name="__module.model.layers.4.self_attn/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1213"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1127" name="Constant_340879" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="1128" name="Constant_340872" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1129" name="Constant_340874" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1130" name="Constant_340876" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1131" name="Concat_340877" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1132" name="Broadcast_340880" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1133" name="ReadValue_333212" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.4.keypresent.4.key" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.4.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1134" name="Constant_325333" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1135" name="Gather_325334" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1136" name="self.model.layers.4.self_attn.k_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="1364922488" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1137" name="Convert_387067" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1138" name="self.model.layers.4.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="1367543928" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1139" name="Convert_387069" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1140" name="self.model.layers.4.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1141" name="self.model.layers.4.self_attn.k_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="1367564408" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1142" name="self.model.layers.4.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1143" name="Constant_387074" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1144" name="Reshape_387075" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1145" name="__module.model.layers.4.self_attn.k_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1146" name="__module.model.layers.4.self_attn.k_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="1147" name="self.model.layers.4.self_attn.k_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="1367646328" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.4.self_attn.k_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="1148" name="__module.model.layers.4.self_attn.k_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="1149" name="__module.model.layers.4.self_attn.k_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1183,key_states.21"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="1150" name="Constant_301722" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1151" name="__module.model.layers.4.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1191"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1152" name="__module.model.layers.4.self_attn/aten::transpose/ScatterElementsUpdate_1" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1153" name="__module.model.layers.4.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1192,k.9"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1154" name="__module.model.layers.4.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1214"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1155" name="__module.model.layers.4.self_attn/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1156" name="__module.model.layers.4.self_attn/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="1157" name="__module.model.layers.4.self_attn/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="1215,1220" /> + </output> + </layer> + <layer id="1158" name="__module.model.layers.4.self_attn/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="1159" name="__module.model.layers.4.self_attn/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="1217,1218,1222,1223" /> + </output> + </layer> + <layer id="1160" name="Constant_220606" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1161" name="__module.model.layers.4.self_attn/aten::slice/Reshape_13" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1162" name="__module.model.layers.4.self_attn/aten::slice/Reshape_9" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1163" name="__module.model.layers.4.self_attn/aten::slice/Reshape_10" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1164" name="__module.model.layers.4.self_attn/aten::slice/Reshape_11" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1165" name="__module.model.layers.4.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="1224,x2.19"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1166" name="Constant_290093" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1167" name="__module.model.layers.4.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1225"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1168" name="__module.model.layers.4.self_attn/aten::slice/Reshape_12" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1169" name="__module.model.layers.4.self_attn/aten::slice/Reshape_14" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1170" name="__module.model.layers.4.self_attn/aten::slice/Reshape_15" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1171" name="__module.model.layers.4.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="1219"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1172" name="__module.model.layers.4.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1227"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1173" name="__module.model.layers.4.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1228"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1174" name="__module.model.layers.4.self_attn/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1229"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1175" name="__module.model.layers.4.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.4.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1176" name="__module.model.layers.4.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="1241,1242,1243"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1177" name="__module.model.layers.4.self_attn/aten::size/ShapeOf_6" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1178" name="Constant_302384" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="938477672" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1179" name="Constant_302385" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1180" name="Gather_302386" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1181" name="Constant_267978" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1182" name="Constant_276331" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1183" name="Constant_276332" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1184" name="Gather_276333" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1185" name="__module.model.layers.4.self_attn/prim::ListConstruct/Concat_2" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="3" precision="I64" names="1244"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="1186" name="__module.model.layers.4.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1245,hidden_states.131"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1187" name="Constant_301723" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1188" name="__module.model.layers.4.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1249,key_states.23"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1189" name="Constant_340892" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="1190" name="Constant_340885" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1191" name="Constant_340887" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1192" name="Constant_340889" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1193" name="Concat_340890" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1194" name="Broadcast_340893" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1195" name="ReadValue_333214" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.4.valuepresent.4.value" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.4.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1196" name="Constant_325336" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1197" name="Gather_325337" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1198" name="self.model.layers.4.self_attn.v_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="1367648376" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1199" name="Convert_387077" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1200" name="self.model.layers.4.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="1370269816" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1201" name="Convert_387079" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1202" name="self.model.layers.4.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1203" name="self.model.layers.4.self_attn.v_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="1370290296" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1204" name="self.model.layers.4.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1205" name="Constant_387084" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1206" name="Reshape_387085" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1207" name="__module.model.layers.4.self_attn.v_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1208" name="__module.model.layers.4.self_attn.v_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="1209" name="self.model.layers.4.self_attn.v_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="1370372216" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.4.self_attn.v_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="1210" name="__module.model.layers.4.self_attn.v_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="1211" name="__module.model.layers.4.self_attn.v_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1186,value_states.9"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="1212" name="Constant_301724" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1213" name="__module.model.layers.4.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1194"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1214" name="__module.model.layers.4.self_attn/aten::transpose/ScatterElementsUpdate_2" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1215" name="__module.model.layers.4.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1195"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1216" name="__module.model.layers.4.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.4.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1217" name="__module.model.layers.4.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="1257,1258,1259"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1218" name="__module.model.layers.4.self_attn/aten::size/ShapeOf_10" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1219" name="Constant_302109" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1220" name="__module.model.layers.4.self_attn/aten::size/Constant_11" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="1221" name="__module.model.layers.4.self_attn/aten::size/Gather_11" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="1251"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1222" name="Constant_267996" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1223" name="Constant_276341" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1224" name="Constant_276342" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1225" name="Gather_276343" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1226" name="__module.model.layers.4.self_attn/prim::ListConstruct/Concat_5" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="1260"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="1227" name="__module.model.layers.4.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1261,hidden_states.135"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1228" name="Constant_301725" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1229" name="__module.model.layers.4.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1265"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1230" name="__module.model.layers.4.self_attn/aten::slice/Reshape_60" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1231" name="ShapeOf_297924" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1232" name="Constant_297925" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1233" name="Constant_297926" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1234" name="Gather_297927" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1235" name="ShapeOf_297928" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1236" name="Constant_297929" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1237" name="Constant_297930" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1238" name="Gather_297931" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1239" name="Add_297932" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="1266"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1240" name="__module.model.layers.4.self_attn/aten::slice/Reshape_62" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1241" name="__module.model.layers.4.self_attn/aten::slice/Reshape_63" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1242" name="__module.model.layers.4.self_attn/aten::slice/Slice_15" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="1270"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="1243" name="__module.model.layers.4.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1271,attn_output.17"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1244" name="__module.model.layers.4.self_attn/aten::transpose/ScatterElementsUpdate_3" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1245" name="__module.model.layers.4.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1272"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1246" name="Constant_301726" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="798146608" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="1247" name="__module.model.layers.4.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1275"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1248" name="self.model.layers.4.self_attn.o_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="1370374264" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1249" name="Convert_386117" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1250" name="self.model.layers.4.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="1383481464" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1251" name="Convert_386119" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1252" name="self.model.layers.4.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1253" name="self.model.layers.4.self_attn.o_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="1383583864" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1254" name="self.model.layers.4.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1255" name="Constant_386124" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1256" name="Reshape_386125" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1257" name="__module.model.layers.4.self_attn.o_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1258" name="__module.model.layers.4.self_attn.o_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1277,1279,hidden_states.137"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1259" name="__module.model.layers.4/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1282,1284,1295,hidden_states.139,hidden_states.141"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1260" name="Constant_290097" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="1383993464" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1261" name="Constant_290096" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1262" name="Constant_290094" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1263" name="__module.model.layers.4.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1285"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1264" name="Constant_3812" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="1286"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1265" name="__module.model.layers.4.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1287,variance.19"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1266" name="Constant_290095" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1267" name="__module.model.layers.4.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1288"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1268" name="__module.model.layers.4.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1269" name="__module.model.layers.4.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1289"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1270" name="__module.model.layers.4.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1290,1291,hidden_states.143,hidden_states.145"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1271" name="__module.model.layers.4.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1292,1294"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1272" name="self.model.layers.4.mlp.gate_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="1384013944" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1273" name="Convert_384717" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1274" name="self.model.layers.4.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="1419403384" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1275" name="Convert_384719" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1276" name="self.model.layers.4.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1277" name="self.model.layers.4.mlp.gate_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="1419679864" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1278" name="self.model.layers.4.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1279" name="Constant_384724" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1280" name="Reshape_384725" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1281" name="__module.model.layers.4.mlp.gate_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1282" name="__module.model.layers.4.mlp.gate_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1300,input.9"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="1283" name="__module.model.layers.4.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="1301"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="1284" name="self.model.layers.4.mlp.up_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="1420785784" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1285" name="Convert_384707" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1286" name="self.model.layers.4.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="1456175224" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1287" name="Convert_384709" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1288" name="self.model.layers.4.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1289" name="self.model.layers.4.mlp.up_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="1456451704" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1290" name="self.model.layers.4.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1291" name="Constant_384714" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1292" name="Reshape_384715" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1293" name="__module.model.layers.4.mlp.up_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1294" name="__module.model.layers.4.mlp.up_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1303"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="1295" name="__module.model.layers.4.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1304"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="1296" name="self.model.layers.4.mlp.down_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 128" offset="1457557624" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1297" name="Convert_384727" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1298" name="self.model.layers.4.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 1" offset="1492947064" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1299" name="Convert_384729" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1300" name="self.model.layers.4.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1301" name="self.model.layers.4.mlp.down_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 108, 1" offset="1493223544" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1302" name="self.model.layers.4.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1303" name="Constant_384734" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="922101848" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1304" name="Reshape_384735" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="1305" name="__module.model.layers.4.mlp.down_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="1306" name="__module.model.layers.4.mlp.down_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1306,hidden_states.147"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1307" name="__module.model.layers.4/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1307,1309,1317,1328,hidden_states.149,hidden_states.151"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1308" name="Constant_290101" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="1494329464" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1309" name="Constant_290100" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1310" name="Constant_290098" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1311" name="__module.model.layers.5.input_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1318"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1312" name="Constant_3886" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="1319"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1313" name="__module.model.layers.5.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1320,variance.21"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1314" name="Constant_290099" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1315" name="__module.model.layers.5.input_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1321"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1316" name="__module.model.layers.5.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1317" name="__module.model.layers.5.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1322"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1318" name="__module.model.layers.5.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1323,1324,hidden_states.153,hidden_states.155"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1319" name="__module.model.layers.5.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1325,1327,hidden_states.157"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1320" name="self.model.layers.5.self_attn.q_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="1494349944" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1321" name="Convert_386127" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1322" name="self.model.layers.5.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="1507457144" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1323" name="Convert_386129" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1324" name="self.model.layers.5.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1325" name="self.model.layers.5.self_attn.q_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="1507559544" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1326" name="self.model.layers.5.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1327" name="Constant_386134" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1328" name="Reshape_386135" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1329" name="__module.model.layers.5.self_attn.q_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1330" name="__module.model.layers.5.self_attn.q_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1331" name="self.model.layers.5.self_attn.q_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="5120" offset="1507969144" size="10240" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.5.self_attn.q_proj.bias"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1332" name="__module.model.layers.5.self_attn.q_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1333" name="__module.model.layers.5.self_attn.q_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1337,query_states.11"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1334" name="Constant_301727" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="792694336" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1335" name="__module.model.layers.5.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1345"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1336" name="__module.model.layers.5.self_attn/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1337" name="__module.model.layers.5.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1346,q.11"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1338" name="__module.model.layers.5.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1355"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1339" name="__module.model.layers.5.self_attn/aten::size/ShapeOf_3" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1340" name="__module.model.layers.5.self_attn/aten::size/Constant_3" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="1341" name="__module.model.layers.5.self_attn/aten::size/Gather_3" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="1356,1361" /> + </output> + </layer> + <layer id="1342" name="__module.model.layers.5.self_attn/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="1343" name="__module.model.layers.5.self_attn/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="1358,1359,1363,1364" /> + </output> + </layer> + <layer id="1344" name="Constant_220620" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1345" name="__module.model.layers.5.self_attn/aten::slice/Reshape_5" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1346" name="__module.model.layers.5.self_attn/aten::slice/Reshape_1" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1347" name="__module.model.layers.5.self_attn/aten::slice/Reshape_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1348" name="__module.model.layers.5.self_attn/aten::slice/Reshape_3" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1349" name="__module.model.layers.5.self_attn/aten::slice/Slice" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="1365,x2.21"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1350" name="Constant_290102" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1351" name="__module.model.layers.5.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1366"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1352" name="__module.model.layers.5.self_attn/aten::slice/Reshape_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1353" name="__module.model.layers.5.self_attn/aten::slice/Reshape_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1354" name="__module.model.layers.5.self_attn/aten::slice/Reshape_7" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1355" name="__module.model.layers.5.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="1360"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1356" name="__module.model.layers.5.self_attn/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1368"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1357" name="__module.model.layers.5.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1369"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1358" name="__module.model.layers.5.self_attn/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1370"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1359" name="Constant_340905" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="1360" name="Constant_340898" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1361" name="Constant_340900" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1362" name="Constant_340902" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1363" name="Concat_340903" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1364" name="Broadcast_340906" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1365" name="ReadValue_333248" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.5.keypresent.5.key" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.5.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1366" name="Constant_325339" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1367" name="Gather_325340" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1368" name="self.model.layers.5.self_attn.k_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="1507979384" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1369" name="Convert_387087" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1370" name="self.model.layers.5.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="1510600824" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1371" name="Convert_387089" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1372" name="self.model.layers.5.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1373" name="self.model.layers.5.self_attn.k_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="1510621304" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1374" name="self.model.layers.5.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1375" name="Constant_387094" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1376" name="Reshape_387095" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1377" name="__module.model.layers.5.self_attn.k_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1378" name="__module.model.layers.5.self_attn.k_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="1379" name="self.model.layers.5.self_attn.k_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="1510703224" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.5.self_attn.k_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="1380" name="__module.model.layers.5.self_attn.k_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="1381" name="__module.model.layers.5.self_attn.k_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1340,key_states.25"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="1382" name="Constant_301728" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1383" name="__module.model.layers.5.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1348"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1384" name="__module.model.layers.5.self_attn/aten::transpose/ScatterElementsUpdate_1" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1385" name="__module.model.layers.5.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1349,k.11"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1386" name="__module.model.layers.5.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1371"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1387" name="__module.model.layers.5.self_attn/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1388" name="__module.model.layers.5.self_attn/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="1389" name="__module.model.layers.5.self_attn/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="1372,1377" /> + </output> + </layer> + <layer id="1390" name="__module.model.layers.5.self_attn/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="1391" name="__module.model.layers.5.self_attn/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="1374,1375,1379,1380" /> + </output> + </layer> + <layer id="1392" name="Constant_220621" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1393" name="__module.model.layers.5.self_attn/aten::slice/Reshape_13" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1394" name="__module.model.layers.5.self_attn/aten::slice/Reshape_9" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1395" name="__module.model.layers.5.self_attn/aten::slice/Reshape_10" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1396" name="__module.model.layers.5.self_attn/aten::slice/Reshape_11" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1397" name="__module.model.layers.5.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="1381,x2.23"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1398" name="Constant_290103" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1399" name="__module.model.layers.5.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1382"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1400" name="__module.model.layers.5.self_attn/aten::slice/Reshape_12" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1401" name="__module.model.layers.5.self_attn/aten::slice/Reshape_14" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1402" name="__module.model.layers.5.self_attn/aten::slice/Reshape_15" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1403" name="__module.model.layers.5.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="1376"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1404" name="__module.model.layers.5.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1384"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1405" name="__module.model.layers.5.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1385"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1406" name="__module.model.layers.5.self_attn/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1386"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1407" name="__module.model.layers.5.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.5.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1408" name="__module.model.layers.5.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="1398,1399,1400"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1409" name="__module.model.layers.5.self_attn/aten::size/ShapeOf_6" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1410" name="Constant_302389" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="938477672" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1411" name="Constant_302390" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1412" name="Gather_302391" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1413" name="Constant_268014" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1414" name="Constant_276366" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1415" name="Constant_276367" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1416" name="Gather_276368" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1417" name="__module.model.layers.5.self_attn/prim::ListConstruct/Concat_2" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="3" precision="I64" names="1401"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="1418" name="__module.model.layers.5.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1402,hidden_states.161"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1419" name="Constant_301729" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1420" name="__module.model.layers.5.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1406,key_states.27"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1421" name="Constant_340918" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="1422" name="Constant_340911" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1423" name="Constant_340913" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1424" name="Constant_340915" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1425" name="Concat_340916" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1426" name="Broadcast_340919" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1427" name="ReadValue_333250" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.5.valuepresent.5.value" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.5.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1428" name="Constant_325342" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1429" name="Gather_325343" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1430" name="self.model.layers.5.self_attn.v_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="1510705272" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1431" name="Convert_387097" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1432" name="self.model.layers.5.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="1513326712" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1433" name="Convert_387099" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1434" name="self.model.layers.5.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1435" name="self.model.layers.5.self_attn.v_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="1513347192" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1436" name="self.model.layers.5.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1437" name="Constant_387104" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1438" name="Reshape_387105" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1439" name="__module.model.layers.5.self_attn.v_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1440" name="__module.model.layers.5.self_attn.v_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="1441" name="self.model.layers.5.self_attn.v_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="1513429112" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.5.self_attn.v_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="1442" name="__module.model.layers.5.self_attn.v_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="1443" name="__module.model.layers.5.self_attn.v_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1343,value_states.11"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="1444" name="Constant_301730" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1445" name="__module.model.layers.5.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1351"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1446" name="__module.model.layers.5.self_attn/aten::transpose/ScatterElementsUpdate_2" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1447" name="__module.model.layers.5.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1352"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1448" name="__module.model.layers.5.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.5.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1449" name="__module.model.layers.5.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="1414,1415,1416"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1450" name="__module.model.layers.5.self_attn/aten::size/ShapeOf_10" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1451" name="Constant_302115" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1452" name="__module.model.layers.5.self_attn/aten::size/Constant_11" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="1453" name="__module.model.layers.5.self_attn/aten::size/Gather_11" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="1408"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1454" name="Constant_268032" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1455" name="Constant_276376" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1456" name="Constant_276377" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1457" name="Gather_276378" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1458" name="__module.model.layers.5.self_attn/prim::ListConstruct/Concat_5" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="1417"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="1459" name="__module.model.layers.5.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1418,hidden_states.165"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1460" name="Constant_301731" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1461" name="__module.model.layers.5.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1422"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1462" name="__module.model.layers.5.self_attn/aten::slice/Reshape_60" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1463" name="ShapeOf_298010" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1464" name="Constant_298011" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1465" name="Constant_298012" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1466" name="Gather_298013" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1467" name="ShapeOf_298014" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1468" name="Constant_298015" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1469" name="Constant_298016" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1470" name="Gather_298017" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1471" name="Add_298018" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="1423"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1472" name="__module.model.layers.5.self_attn/aten::slice/Reshape_62" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1473" name="__module.model.layers.5.self_attn/aten::slice/Reshape_63" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1474" name="__module.model.layers.5.self_attn/aten::slice/Slice_15" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="1427"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="1475" name="__module.model.layers.5.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1428,attn_output.21"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1476" name="__module.model.layers.5.self_attn/aten::transpose/ScatterElementsUpdate_3" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1477" name="__module.model.layers.5.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1429"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1478" name="Constant_301732" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="798146608" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="1479" name="__module.model.layers.5.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1432"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1480" name="self.model.layers.5.self_attn.o_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="1513431160" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1481" name="Convert_386137" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1482" name="self.model.layers.5.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="1526538360" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1483" name="Convert_386139" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1484" name="self.model.layers.5.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1485" name="self.model.layers.5.self_attn.o_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="1526640760" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1486" name="self.model.layers.5.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1487" name="Constant_386144" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1488" name="Reshape_386145" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1489" name="__module.model.layers.5.self_attn.o_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1490" name="__module.model.layers.5.self_attn.o_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1434,1436,hidden_states.167"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1491" name="__module.model.layers.5/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1439,1441,1452,hidden_states.169,hidden_states.171"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1492" name="Constant_290107" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="1527050360" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1493" name="Constant_290106" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1494" name="Constant_290104" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1495" name="__module.model.layers.5.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1442"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1496" name="Constant_4484" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="1443"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1497" name="__module.model.layers.5.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1444,variance.23"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1498" name="Constant_290105" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1499" name="__module.model.layers.5.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1445"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1500" name="__module.model.layers.5.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1501" name="__module.model.layers.5.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1446"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1502" name="__module.model.layers.5.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1447,1448,hidden_states.173,hidden_states.175"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1503" name="__module.model.layers.5.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1449,1451"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1504" name="self.model.layers.5.mlp.gate_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="1527070840" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1505" name="Convert_384747" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1506" name="self.model.layers.5.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="1562460280" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1507" name="Convert_384749" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1508" name="self.model.layers.5.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1509" name="self.model.layers.5.mlp.gate_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="1562736760" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1510" name="self.model.layers.5.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1511" name="Constant_384754" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1512" name="Reshape_384755" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1513" name="__module.model.layers.5.mlp.gate_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1514" name="__module.model.layers.5.mlp.gate_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1457,input.11"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="1515" name="__module.model.layers.5.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="1458"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="1516" name="self.model.layers.5.mlp.up_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="1563842680" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1517" name="Convert_384737" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1518" name="self.model.layers.5.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="1599232120" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1519" name="Convert_384739" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1520" name="self.model.layers.5.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1521" name="self.model.layers.5.mlp.up_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="1599508600" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1522" name="self.model.layers.5.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1523" name="Constant_384744" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1524" name="Reshape_384745" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1525" name="__module.model.layers.5.mlp.up_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1526" name="__module.model.layers.5.mlp.up_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1460"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="1527" name="__module.model.layers.5.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1461"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="1528" name="self.model.layers.5.mlp.down_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 128" offset="1600614520" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1529" name="Convert_384757" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1530" name="self.model.layers.5.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 1" offset="1636003960" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1531" name="Convert_384759" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1532" name="self.model.layers.5.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1533" name="self.model.layers.5.mlp.down_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 108, 1" offset="1636280440" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1534" name="self.model.layers.5.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1535" name="Constant_384764" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="922101848" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1536" name="Reshape_384765" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="1537" name="__module.model.layers.5.mlp.down_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="1538" name="__module.model.layers.5.mlp.down_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1463,hidden_states.177"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1539" name="__module.model.layers.5/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1464,1466,1474,1485,hidden_states.179,hidden_states.181"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1540" name="Constant_290111" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="1637386360" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1541" name="Constant_290110" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1542" name="Constant_290108" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1543" name="__module.model.layers.6.input_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1475"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1544" name="Constant_4558" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="1476"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1545" name="__module.model.layers.6.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1477,variance.25"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1546" name="Constant_290109" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1547" name="__module.model.layers.6.input_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1478"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1548" name="__module.model.layers.6.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1549" name="__module.model.layers.6.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1479"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1550" name="__module.model.layers.6.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1480,1481,hidden_states.183,hidden_states.185"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1551" name="__module.model.layers.6.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1482,1484,hidden_states.187"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1552" name="self.model.layers.6.self_attn.q_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="1637406840" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1553" name="Convert_386147" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1554" name="self.model.layers.6.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="1650514040" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1555" name="Convert_386149" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1556" name="self.model.layers.6.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1557" name="self.model.layers.6.self_attn.q_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="1650616440" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1558" name="self.model.layers.6.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1559" name="Constant_386154" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1560" name="Reshape_386155" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1561" name="__module.model.layers.6.self_attn.q_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1562" name="__module.model.layers.6.self_attn.q_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1563" name="self.model.layers.6.self_attn.q_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="5120" offset="1651026040" size="10240" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.6.self_attn.q_proj.bias"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1564" name="__module.model.layers.6.self_attn.q_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1565" name="__module.model.layers.6.self_attn.q_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1494,query_states.13"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1566" name="Constant_301733" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="792694336" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1567" name="__module.model.layers.6.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1502"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1568" name="__module.model.layers.6.self_attn/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1569" name="__module.model.layers.6.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1503,q.13"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1570" name="__module.model.layers.6.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1512"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1571" name="__module.model.layers.6.self_attn/aten::size/ShapeOf_3" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1572" name="__module.model.layers.6.self_attn/aten::size/Constant_3" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="1573" name="__module.model.layers.6.self_attn/aten::size/Gather_3" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="1513,1518" /> + </output> + </layer> + <layer id="1574" name="__module.model.layers.6.self_attn/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="1575" name="__module.model.layers.6.self_attn/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="1515,1516,1520,1521" /> + </output> + </layer> + <layer id="1576" name="Constant_220635" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1577" name="__module.model.layers.6.self_attn/aten::slice/Reshape_5" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1578" name="__module.model.layers.6.self_attn/aten::slice/Reshape_1" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1579" name="__module.model.layers.6.self_attn/aten::slice/Reshape_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1580" name="__module.model.layers.6.self_attn/aten::slice/Reshape_3" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1581" name="__module.model.layers.6.self_attn/aten::slice/Slice" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="1522,x2.25"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1582" name="Constant_290112" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1583" name="__module.model.layers.6.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1523"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1584" name="__module.model.layers.6.self_attn/aten::slice/Reshape_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1585" name="__module.model.layers.6.self_attn/aten::slice/Reshape_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1586" name="__module.model.layers.6.self_attn/aten::slice/Reshape_7" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1587" name="__module.model.layers.6.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="1517"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1588" name="__module.model.layers.6.self_attn/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1525"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1589" name="__module.model.layers.6.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1526"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1590" name="__module.model.layers.6.self_attn/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1527"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1591" name="Constant_340931" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="1592" name="Constant_340924" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1593" name="Constant_340926" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1594" name="Constant_340928" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1595" name="Concat_340929" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1596" name="Broadcast_340932" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1597" name="ReadValue_333252" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.6.keypresent.6.key" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.6.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1598" name="Constant_325345" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1599" name="Gather_325346" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1600" name="self.model.layers.6.self_attn.k_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="1651036280" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1601" name="Convert_387107" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1602" name="self.model.layers.6.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="1653657720" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1603" name="Convert_387109" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1604" name="self.model.layers.6.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1605" name="self.model.layers.6.self_attn.k_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="1653678200" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1606" name="self.model.layers.6.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1607" name="Constant_387114" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1608" name="Reshape_387115" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1609" name="__module.model.layers.6.self_attn.k_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1610" name="__module.model.layers.6.self_attn.k_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="1611" name="self.model.layers.6.self_attn.k_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="1653760120" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.6.self_attn.k_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="1612" name="__module.model.layers.6.self_attn.k_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="1613" name="__module.model.layers.6.self_attn.k_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1497,key_states.29"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="1614" name="Constant_301734" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1615" name="__module.model.layers.6.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1505"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1616" name="__module.model.layers.6.self_attn/aten::transpose/ScatterElementsUpdate_1" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1617" name="__module.model.layers.6.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1506,k.13"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1618" name="__module.model.layers.6.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1528"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1619" name="__module.model.layers.6.self_attn/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1620" name="__module.model.layers.6.self_attn/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="1621" name="__module.model.layers.6.self_attn/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="1529,1534" /> + </output> + </layer> + <layer id="1622" name="__module.model.layers.6.self_attn/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="1623" name="__module.model.layers.6.self_attn/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="1531,1532,1536,1537" /> + </output> + </layer> + <layer id="1624" name="Constant_220636" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1625" name="__module.model.layers.6.self_attn/aten::slice/Reshape_13" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1626" name="__module.model.layers.6.self_attn/aten::slice/Reshape_9" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1627" name="__module.model.layers.6.self_attn/aten::slice/Reshape_10" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1628" name="__module.model.layers.6.self_attn/aten::slice/Reshape_11" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1629" name="__module.model.layers.6.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="1538,x2.27"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1630" name="Constant_290113" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1631" name="__module.model.layers.6.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1539"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1632" name="__module.model.layers.6.self_attn/aten::slice/Reshape_12" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1633" name="__module.model.layers.6.self_attn/aten::slice/Reshape_14" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1634" name="__module.model.layers.6.self_attn/aten::slice/Reshape_15" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1635" name="__module.model.layers.6.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="1533"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1636" name="__module.model.layers.6.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1541"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1637" name="__module.model.layers.6.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1542"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1638" name="__module.model.layers.6.self_attn/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1543"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1639" name="__module.model.layers.6.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.6.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1640" name="__module.model.layers.6.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="1555,1556,1557"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1641" name="__module.model.layers.6.self_attn/aten::size/ShapeOf_6" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1642" name="Constant_302394" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="938477672" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1643" name="Constant_302395" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1644" name="Gather_302396" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1645" name="Constant_268050" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1646" name="Constant_276401" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1647" name="Constant_276402" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1648" name="Gather_276403" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1649" name="__module.model.layers.6.self_attn/prim::ListConstruct/Concat_2" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="3" precision="I64" names="1558"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="1650" name="__module.model.layers.6.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1559,hidden_states.191"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1651" name="Constant_301735" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1652" name="__module.model.layers.6.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1563,key_states.31"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1653" name="Constant_340944" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="1654" name="Constant_340937" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1655" name="Constant_340939" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1656" name="Constant_340941" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1657" name="Concat_340942" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1658" name="Broadcast_340945" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1659" name="ReadValue_333254" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.6.valuepresent.6.value" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.6.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1660" name="Constant_325348" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1661" name="Gather_325349" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1662" name="self.model.layers.6.self_attn.v_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="1653762168" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1663" name="Convert_387117" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1664" name="self.model.layers.6.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="1656383608" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1665" name="Convert_387119" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1666" name="self.model.layers.6.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1667" name="self.model.layers.6.self_attn.v_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="1656404088" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1668" name="self.model.layers.6.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1669" name="Constant_387124" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1670" name="Reshape_387125" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1671" name="__module.model.layers.6.self_attn.v_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1672" name="__module.model.layers.6.self_attn.v_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="1673" name="self.model.layers.6.self_attn.v_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="1656486008" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.6.self_attn.v_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="1674" name="__module.model.layers.6.self_attn.v_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="1675" name="__module.model.layers.6.self_attn.v_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1500,value_states.13"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="1676" name="Constant_301736" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1677" name="__module.model.layers.6.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1508"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1678" name="__module.model.layers.6.self_attn/aten::transpose/ScatterElementsUpdate_2" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1679" name="__module.model.layers.6.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1509"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1680" name="__module.model.layers.6.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.6.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1681" name="__module.model.layers.6.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="1571,1572,1573"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1682" name="__module.model.layers.6.self_attn/aten::size/ShapeOf_10" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1683" name="Constant_302121" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1684" name="__module.model.layers.6.self_attn/aten::size/Constant_11" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="1685" name="__module.model.layers.6.self_attn/aten::size/Gather_11" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="1565"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1686" name="Constant_268068" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1687" name="Constant_276411" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1688" name="Constant_276412" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1689" name="Gather_276413" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1690" name="__module.model.layers.6.self_attn/prim::ListConstruct/Concat_5" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="1574"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="1691" name="__module.model.layers.6.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1575,hidden_states.195"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1692" name="Constant_301737" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1693" name="__module.model.layers.6.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1579"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1694" name="__module.model.layers.6.self_attn/aten::slice/Reshape_60" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1695" name="ShapeOf_298096" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1696" name="Constant_298097" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1697" name="Constant_298098" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1698" name="Gather_298099" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1699" name="ShapeOf_298100" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1700" name="Constant_298101" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1701" name="Constant_298102" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1702" name="Gather_298103" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1703" name="Add_298104" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="1580"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1704" name="__module.model.layers.6.self_attn/aten::slice/Reshape_62" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1705" name="__module.model.layers.6.self_attn/aten::slice/Reshape_63" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1706" name="__module.model.layers.6.self_attn/aten::slice/Slice_15" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="1584"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="1707" name="__module.model.layers.6.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1585,attn_output.25"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1708" name="__module.model.layers.6.self_attn/aten::transpose/ScatterElementsUpdate_3" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1709" name="__module.model.layers.6.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1586"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1710" name="Constant_301738" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="798146608" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="1711" name="__module.model.layers.6.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1589"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1712" name="self.model.layers.6.self_attn.o_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="1656488056" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1713" name="Convert_386157" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1714" name="self.model.layers.6.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="1669595256" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1715" name="Convert_386159" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1716" name="self.model.layers.6.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1717" name="self.model.layers.6.self_attn.o_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="1669697656" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1718" name="self.model.layers.6.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1719" name="Constant_386164" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1720" name="Reshape_386165" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1721" name="__module.model.layers.6.self_attn.o_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1722" name="__module.model.layers.6.self_attn.o_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1591,1593,hidden_states.197"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1723" name="__module.model.layers.6/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1596,1598,1609,hidden_states.199,hidden_states.201"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1724" name="Constant_290117" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="1670107256" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1725" name="Constant_290116" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1726" name="Constant_290114" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1727" name="__module.model.layers.6.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1599"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1728" name="Constant_5156" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="1600"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1729" name="__module.model.layers.6.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1601,variance.27"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1730" name="Constant_290115" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1731" name="__module.model.layers.6.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1602"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1732" name="__module.model.layers.6.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1733" name="__module.model.layers.6.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1603"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1734" name="__module.model.layers.6.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1604,1605,hidden_states.203,hidden_states.205"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1735" name="__module.model.layers.6.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1606,1608"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1736" name="self.model.layers.6.mlp.gate_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="1670127736" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1737" name="Convert_384777" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1738" name="self.model.layers.6.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="1705517176" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1739" name="Convert_384779" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1740" name="self.model.layers.6.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1741" name="self.model.layers.6.mlp.gate_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="1705793656" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1742" name="self.model.layers.6.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1743" name="Constant_384784" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1744" name="Reshape_384785" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1745" name="__module.model.layers.6.mlp.gate_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1746" name="__module.model.layers.6.mlp.gate_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1614,input.13"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="1747" name="__module.model.layers.6.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="1615"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="1748" name="self.model.layers.6.mlp.up_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="1706899576" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1749" name="Convert_384767" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1750" name="self.model.layers.6.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="1742289016" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1751" name="Convert_384769" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1752" name="self.model.layers.6.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1753" name="self.model.layers.6.mlp.up_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="1742565496" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1754" name="self.model.layers.6.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1755" name="Constant_384774" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1756" name="Reshape_384775" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1757" name="__module.model.layers.6.mlp.up_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1758" name="__module.model.layers.6.mlp.up_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1617"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="1759" name="__module.model.layers.6.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1618"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="1760" name="self.model.layers.6.mlp.down_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 128" offset="1743671416" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1761" name="Convert_384787" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1762" name="self.model.layers.6.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 1" offset="1779060856" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1763" name="Convert_384789" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1764" name="self.model.layers.6.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1765" name="self.model.layers.6.mlp.down_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 108, 1" offset="1779337336" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1766" name="self.model.layers.6.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1767" name="Constant_384794" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="922101848" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1768" name="Reshape_384795" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="1769" name="__module.model.layers.6.mlp.down_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="1770" name="__module.model.layers.6.mlp.down_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1620,hidden_states.207"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1771" name="__module.model.layers.6/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1621,1623,1631,1642,hidden_states.209,hidden_states.211"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1772" name="Constant_290121" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="1780443256" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1773" name="Constant_290120" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1774" name="Constant_290118" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1775" name="__module.model.layers.7.input_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1632"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1776" name="Constant_5230" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="1633"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1777" name="__module.model.layers.7.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1634,variance.29"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1778" name="Constant_290119" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1779" name="__module.model.layers.7.input_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1635"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1780" name="__module.model.layers.7.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1781" name="__module.model.layers.7.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1636"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1782" name="__module.model.layers.7.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1637,1638,hidden_states.213,hidden_states.215"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1783" name="__module.model.layers.7.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1639,1641,hidden_states.217"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1784" name="self.model.layers.7.self_attn.q_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="1780463736" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1785" name="Convert_386167" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1786" name="self.model.layers.7.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="1793570936" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1787" name="Convert_386169" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1788" name="self.model.layers.7.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1789" name="self.model.layers.7.self_attn.q_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="1793673336" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1790" name="self.model.layers.7.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1791" name="Constant_386174" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1792" name="Reshape_386175" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1793" name="__module.model.layers.7.self_attn.q_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1794" name="__module.model.layers.7.self_attn.q_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1795" name="self.model.layers.7.self_attn.q_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="5120" offset="1794082936" size="10240" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.7.self_attn.q_proj.bias"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1796" name="__module.model.layers.7.self_attn.q_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1797" name="__module.model.layers.7.self_attn.q_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1651,query_states.15"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1798" name="Constant_301739" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="792694336" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1799" name="__module.model.layers.7.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1659"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1800" name="__module.model.layers.7.self_attn/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1801" name="__module.model.layers.7.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1660,q.15"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1802" name="__module.model.layers.7.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1669"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1803" name="__module.model.layers.7.self_attn/aten::size/ShapeOf_3" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1804" name="__module.model.layers.7.self_attn/aten::size/Constant_3" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="1805" name="__module.model.layers.7.self_attn/aten::size/Gather_3" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="1670,1675" /> + </output> + </layer> + <layer id="1806" name="__module.model.layers.7.self_attn/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="1807" name="__module.model.layers.7.self_attn/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="1672,1673,1677,1678" /> + </output> + </layer> + <layer id="1808" name="Constant_220650" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1809" name="__module.model.layers.7.self_attn/aten::slice/Reshape_5" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1810" name="__module.model.layers.7.self_attn/aten::slice/Reshape_1" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1811" name="__module.model.layers.7.self_attn/aten::slice/Reshape_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1812" name="__module.model.layers.7.self_attn/aten::slice/Reshape_3" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1813" name="__module.model.layers.7.self_attn/aten::slice/Slice" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="1679,x2.29"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1814" name="Constant_290122" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1815" name="__module.model.layers.7.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1680"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1816" name="__module.model.layers.7.self_attn/aten::slice/Reshape_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1817" name="__module.model.layers.7.self_attn/aten::slice/Reshape_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1818" name="__module.model.layers.7.self_attn/aten::slice/Reshape_7" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1819" name="__module.model.layers.7.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="1674"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1820" name="__module.model.layers.7.self_attn/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1682"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1821" name="__module.model.layers.7.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1683"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1822" name="__module.model.layers.7.self_attn/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1684"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1823" name="Constant_340957" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="1824" name="Constant_340950" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1825" name="Constant_340952" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1826" name="Constant_340954" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1827" name="Concat_340955" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1828" name="Broadcast_340958" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1829" name="ReadValue_333256" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.7.keypresent.7.key" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.7.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1830" name="Constant_325351" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1831" name="Gather_325352" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1832" name="self.model.layers.7.self_attn.k_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="1794093176" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1833" name="Convert_387127" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1834" name="self.model.layers.7.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="1796714616" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1835" name="Convert_387129" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1836" name="self.model.layers.7.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1837" name="self.model.layers.7.self_attn.k_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="1796735096" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1838" name="self.model.layers.7.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1839" name="Constant_387134" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1840" name="Reshape_387135" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1841" name="__module.model.layers.7.self_attn.k_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1842" name="__module.model.layers.7.self_attn.k_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="1843" name="self.model.layers.7.self_attn.k_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="1796817016" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.7.self_attn.k_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="1844" name="__module.model.layers.7.self_attn.k_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="1845" name="__module.model.layers.7.self_attn.k_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1654,key_states.33"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="1846" name="Constant_301740" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1847" name="__module.model.layers.7.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1662"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1848" name="__module.model.layers.7.self_attn/aten::transpose/ScatterElementsUpdate_1" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1849" name="__module.model.layers.7.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1663,k.15"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1850" name="__module.model.layers.7.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1685"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1851" name="__module.model.layers.7.self_attn/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1852" name="__module.model.layers.7.self_attn/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="1853" name="__module.model.layers.7.self_attn/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="1686,1691" /> + </output> + </layer> + <layer id="1854" name="__module.model.layers.7.self_attn/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="1855" name="__module.model.layers.7.self_attn/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="1688,1689,1693,1694" /> + </output> + </layer> + <layer id="1856" name="Constant_220651" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1857" name="__module.model.layers.7.self_attn/aten::slice/Reshape_13" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1858" name="__module.model.layers.7.self_attn/aten::slice/Reshape_9" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1859" name="__module.model.layers.7.self_attn/aten::slice/Reshape_10" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1860" name="__module.model.layers.7.self_attn/aten::slice/Reshape_11" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1861" name="__module.model.layers.7.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="1695,x2.31"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1862" name="Constant_290123" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1863" name="__module.model.layers.7.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1696"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1864" name="__module.model.layers.7.self_attn/aten::slice/Reshape_12" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1865" name="__module.model.layers.7.self_attn/aten::slice/Reshape_14" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1866" name="__module.model.layers.7.self_attn/aten::slice/Reshape_15" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1867" name="__module.model.layers.7.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="1690"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="1868" name="__module.model.layers.7.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1698"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1869" name="__module.model.layers.7.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1699"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1870" name="__module.model.layers.7.self_attn/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1700"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1871" name="__module.model.layers.7.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.7.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1872" name="__module.model.layers.7.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="1712,1713,1714"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1873" name="__module.model.layers.7.self_attn/aten::size/ShapeOf_6" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1874" name="Constant_302399" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="938477672" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1875" name="Constant_302400" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1876" name="Gather_302401" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1877" name="Constant_268086" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1878" name="Constant_276436" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1879" name="Constant_276437" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1880" name="Gather_276438" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1881" name="__module.model.layers.7.self_attn/prim::ListConstruct/Concat_2" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="3" precision="I64" names="1715"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="1882" name="__module.model.layers.7.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1716,hidden_states.221"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1883" name="Constant_301741" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1884" name="__module.model.layers.7.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1720,key_states.35"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1885" name="Constant_340970" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="1886" name="Constant_340963" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1887" name="Constant_340965" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1888" name="Constant_340967" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1889" name="Concat_340968" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1890" name="Broadcast_340971" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1891" name="ReadValue_333258" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.7.valuepresent.7.value" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.7.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1892" name="Constant_325354" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1893" name="Gather_325355" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1894" name="self.model.layers.7.self_attn.v_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="1796819064" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1895" name="Convert_387137" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1896" name="self.model.layers.7.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="1799440504" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1897" name="Convert_387139" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1898" name="self.model.layers.7.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1899" name="self.model.layers.7.self_attn.v_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="1799460984" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1900" name="self.model.layers.7.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1901" name="Constant_387144" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1902" name="Reshape_387145" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1903" name="__module.model.layers.7.self_attn.v_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1904" name="__module.model.layers.7.self_attn.v_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="1905" name="self.model.layers.7.self_attn.v_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="1799542904" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.7.self_attn.v_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="1906" name="__module.model.layers.7.self_attn.v_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="1907" name="__module.model.layers.7.self_attn.v_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1657,value_states.15"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="1908" name="Constant_301742" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1909" name="__module.model.layers.7.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1665"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1910" name="__module.model.layers.7.self_attn/aten::transpose/ScatterElementsUpdate_2" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1911" name="__module.model.layers.7.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1666"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1912" name="__module.model.layers.7.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.7.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1913" name="__module.model.layers.7.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="1728,1729,1730"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1914" name="__module.model.layers.7.self_attn/aten::size/ShapeOf_10" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1915" name="Constant_302127" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1916" name="__module.model.layers.7.self_attn/aten::size/Constant_11" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="1917" name="__module.model.layers.7.self_attn/aten::size/Gather_11" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="1722"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1918" name="Constant_268104" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1919" name="Constant_276446" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1920" name="Constant_276447" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1921" name="Gather_276448" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1922" name="__module.model.layers.7.self_attn/prim::ListConstruct/Concat_5" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="1731"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="1923" name="__module.model.layers.7.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1732,hidden_states.225"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1924" name="Constant_301743" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1925" name="__module.model.layers.7.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1736"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1926" name="__module.model.layers.7.self_attn/aten::slice/Reshape_60" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1927" name="ShapeOf_298182" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1928" name="Constant_298183" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1929" name="Constant_298184" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1930" name="Gather_298185" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1931" name="ShapeOf_298186" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1932" name="Constant_298187" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1933" name="Constant_298188" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="1934" name="Gather_298189" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1935" name="Add_298190" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="1737"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1936" name="__module.model.layers.7.self_attn/aten::slice/Reshape_62" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1937" name="__module.model.layers.7.self_attn/aten::slice/Reshape_63" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1938" name="__module.model.layers.7.self_attn/aten::slice/Slice_15" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="1741"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="1939" name="__module.model.layers.7.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1742,attn_output.29"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1940" name="__module.model.layers.7.self_attn/aten::transpose/ScatterElementsUpdate_3" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="1941" name="__module.model.layers.7.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1743"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1942" name="Constant_301744" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="798146608" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="1943" name="__module.model.layers.7.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1746"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1944" name="self.model.layers.7.self_attn.o_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="1799544952" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1945" name="Convert_386177" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1946" name="self.model.layers.7.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="1812652152" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1947" name="Convert_386179" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1948" name="self.model.layers.7.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1949" name="self.model.layers.7.self_attn.o_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="1812754552" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1950" name="self.model.layers.7.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1951" name="Constant_386184" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1952" name="Reshape_386185" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1953" name="__module.model.layers.7.self_attn.o_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1954" name="__module.model.layers.7.self_attn.o_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1748,1750,hidden_states.227"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1955" name="__module.model.layers.7/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1753,1755,1766,hidden_states.229,hidden_states.231"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1956" name="Constant_290127" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="1813164152" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1957" name="Constant_290126" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1958" name="Constant_290124" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1959" name="__module.model.layers.7.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1756"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1960" name="Constant_5828" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="1757"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1961" name="__module.model.layers.7.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1758,variance.31"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1962" name="Constant_290125" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1963" name="__module.model.layers.7.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1759"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1964" name="__module.model.layers.7.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1965" name="__module.model.layers.7.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1760"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1966" name="__module.model.layers.7.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1761,1762,hidden_states.233,hidden_states.235"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1967" name="__module.model.layers.7.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1763,1765"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1968" name="self.model.layers.7.mlp.gate_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="1813184632" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1969" name="Convert_384807" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1970" name="self.model.layers.7.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="1848574072" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1971" name="Convert_384809" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1972" name="self.model.layers.7.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1973" name="self.model.layers.7.mlp.gate_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="1848850552" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1974" name="self.model.layers.7.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1975" name="Constant_384814" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1976" name="Reshape_384815" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1977" name="__module.model.layers.7.mlp.gate_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1978" name="__module.model.layers.7.mlp.gate_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1771,input.15"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="1979" name="__module.model.layers.7.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="1772"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="1980" name="self.model.layers.7.mlp.up_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="1849956472" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1981" name="Convert_384797" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1982" name="self.model.layers.7.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="1885345912" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1983" name="Convert_384799" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1984" name="self.model.layers.7.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1985" name="self.model.layers.7.mlp.up_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="1885622392" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1986" name="self.model.layers.7.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1987" name="Constant_384804" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="1988" name="Reshape_384805" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1989" name="__module.model.layers.7.mlp.up_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="1990" name="__module.model.layers.7.mlp.up_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1774"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="1991" name="__module.model.layers.7.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1775"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="1992" name="self.model.layers.7.mlp.down_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 128" offset="1886728312" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1993" name="Convert_384817" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1994" name="self.model.layers.7.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 1" offset="1922117752" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1995" name="Convert_384819" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1996" name="self.model.layers.7.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1997" name="self.model.layers.7.mlp.down_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 108, 1" offset="1922394232" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="1998" name="self.model.layers.7.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="1999" name="Constant_384824" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="922101848" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2000" name="Reshape_384825" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="2001" name="__module.model.layers.7.mlp.down_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="2002" name="__module.model.layers.7.mlp.down_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1777,hidden_states.237"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2003" name="__module.model.layers.7/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1778,1780,1788,1799,hidden_states.239,hidden_states.241"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2004" name="Constant_290131" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="1923500152" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2005" name="Constant_290130" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2006" name="Constant_290128" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2007" name="__module.model.layers.8.input_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1789"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2008" name="Constant_5902" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="1790"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2009" name="__module.model.layers.8.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1791,variance.33"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2010" name="Constant_290129" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2011" name="__module.model.layers.8.input_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1792"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2012" name="__module.model.layers.8.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2013" name="__module.model.layers.8.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1793"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2014" name="__module.model.layers.8.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1794,1795,hidden_states.243,hidden_states.245"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2015" name="__module.model.layers.8.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1796,1798,hidden_states.247"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2016" name="self.model.layers.8.self_attn.q_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="1923520632" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2017" name="Convert_386187" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2018" name="self.model.layers.8.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="1936627832" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2019" name="Convert_386189" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2020" name="self.model.layers.8.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2021" name="self.model.layers.8.self_attn.q_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="1936730232" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2022" name="self.model.layers.8.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2023" name="Constant_386194" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2024" name="Reshape_386195" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2025" name="__module.model.layers.8.self_attn.q_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2026" name="__module.model.layers.8.self_attn.q_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2027" name="self.model.layers.8.self_attn.q_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="5120" offset="1937139832" size="10240" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.8.self_attn.q_proj.bias"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2028" name="__module.model.layers.8.self_attn.q_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2029" name="__module.model.layers.8.self_attn.q_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1808,query_states.17"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2030" name="Constant_301745" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="792694336" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2031" name="__module.model.layers.8.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1816"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2032" name="__module.model.layers.8.self_attn/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2033" name="__module.model.layers.8.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1817,q.17"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2034" name="__module.model.layers.8.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1826"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2035" name="__module.model.layers.8.self_attn/aten::size/ShapeOf_3" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2036" name="__module.model.layers.8.self_attn/aten::size/Constant_3" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="2037" name="__module.model.layers.8.self_attn/aten::size/Gather_3" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="1827,1832" /> + </output> + </layer> + <layer id="2038" name="__module.model.layers.8.self_attn/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="2039" name="__module.model.layers.8.self_attn/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="1829,1830,1834,1835" /> + </output> + </layer> + <layer id="2040" name="Constant_220665" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2041" name="__module.model.layers.8.self_attn/aten::slice/Reshape_5" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2042" name="__module.model.layers.8.self_attn/aten::slice/Reshape_1" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2043" name="__module.model.layers.8.self_attn/aten::slice/Reshape_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2044" name="__module.model.layers.8.self_attn/aten::slice/Reshape_3" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2045" name="__module.model.layers.8.self_attn/aten::slice/Slice" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="1836,x2.33"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2046" name="Constant_290132" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2047" name="__module.model.layers.8.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1837"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2048" name="__module.model.layers.8.self_attn/aten::slice/Reshape_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2049" name="__module.model.layers.8.self_attn/aten::slice/Reshape_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2050" name="__module.model.layers.8.self_attn/aten::slice/Reshape_7" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2051" name="__module.model.layers.8.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="1831"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2052" name="__module.model.layers.8.self_attn/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1839"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2053" name="__module.model.layers.8.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1840"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2054" name="__module.model.layers.8.self_attn/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1841"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2055" name="Constant_340983" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="2056" name="Constant_340976" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2057" name="Constant_340978" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2058" name="Constant_340980" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2059" name="Concat_340981" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2060" name="Broadcast_340984" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2061" name="ReadValue_333260" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.8.keypresent.8.key" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.8.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2062" name="Constant_325357" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2063" name="Gather_325358" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2064" name="self.model.layers.8.self_attn.k_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="1937150072" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2065" name="Convert_387147" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2066" name="self.model.layers.8.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="1939771512" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2067" name="Convert_387149" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2068" name="self.model.layers.8.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2069" name="self.model.layers.8.self_attn.k_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="1939791992" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2070" name="self.model.layers.8.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2071" name="Constant_387154" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2072" name="Reshape_387155" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2073" name="__module.model.layers.8.self_attn.k_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2074" name="__module.model.layers.8.self_attn.k_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="2075" name="self.model.layers.8.self_attn.k_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="1939873912" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.8.self_attn.k_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="2076" name="__module.model.layers.8.self_attn.k_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="2077" name="__module.model.layers.8.self_attn.k_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1811,key_states.37"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="2078" name="Constant_301746" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2079" name="__module.model.layers.8.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1819"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2080" name="__module.model.layers.8.self_attn/aten::transpose/ScatterElementsUpdate_1" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2081" name="__module.model.layers.8.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1820,k.17"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2082" name="__module.model.layers.8.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1842"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2083" name="__module.model.layers.8.self_attn/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2084" name="__module.model.layers.8.self_attn/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="2085" name="__module.model.layers.8.self_attn/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="1843,1848" /> + </output> + </layer> + <layer id="2086" name="__module.model.layers.8.self_attn/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="2087" name="__module.model.layers.8.self_attn/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="1845,1846,1850,1851" /> + </output> + </layer> + <layer id="2088" name="Constant_220666" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2089" name="__module.model.layers.8.self_attn/aten::slice/Reshape_13" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2090" name="__module.model.layers.8.self_attn/aten::slice/Reshape_9" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2091" name="__module.model.layers.8.self_attn/aten::slice/Reshape_10" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2092" name="__module.model.layers.8.self_attn/aten::slice/Reshape_11" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2093" name="__module.model.layers.8.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="1852,x2.35"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2094" name="Constant_290133" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2095" name="__module.model.layers.8.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1853"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2096" name="__module.model.layers.8.self_attn/aten::slice/Reshape_12" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2097" name="__module.model.layers.8.self_attn/aten::slice/Reshape_14" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2098" name="__module.model.layers.8.self_attn/aten::slice/Reshape_15" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2099" name="__module.model.layers.8.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="1847"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2100" name="__module.model.layers.8.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1855"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2101" name="__module.model.layers.8.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1856"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2102" name="__module.model.layers.8.self_attn/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1857"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2103" name="__module.model.layers.8.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.8.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2104" name="__module.model.layers.8.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="1869,1870,1871"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2105" name="__module.model.layers.8.self_attn/aten::size/ShapeOf_6" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2106" name="Constant_302404" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="938477672" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2107" name="Constant_302405" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2108" name="Gather_302406" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2109" name="Constant_268122" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2110" name="Constant_276471" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2111" name="Constant_276472" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2112" name="Gather_276473" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2113" name="__module.model.layers.8.self_attn/prim::ListConstruct/Concat_2" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="3" precision="I64" names="1872"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="2114" name="__module.model.layers.8.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1873,hidden_states.251"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2115" name="Constant_301747" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2116" name="__module.model.layers.8.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1877,key_states.39"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2117" name="Constant_340996" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="2118" name="Constant_340989" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2119" name="Constant_340991" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2120" name="Constant_340993" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2121" name="Concat_340994" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2122" name="Broadcast_340997" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2123" name="ReadValue_333262" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.8.valuepresent.8.value" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.8.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2124" name="Constant_325360" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2125" name="Gather_325361" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2126" name="self.model.layers.8.self_attn.v_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="1939875960" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2127" name="Convert_387157" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2128" name="self.model.layers.8.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="1942497400" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2129" name="Convert_387159" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2130" name="self.model.layers.8.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2131" name="self.model.layers.8.self_attn.v_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="1942517880" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2132" name="self.model.layers.8.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2133" name="Constant_387164" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2134" name="Reshape_387165" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2135" name="__module.model.layers.8.self_attn.v_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2136" name="__module.model.layers.8.self_attn.v_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="2137" name="self.model.layers.8.self_attn.v_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="1942599800" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.8.self_attn.v_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="2138" name="__module.model.layers.8.self_attn.v_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="2139" name="__module.model.layers.8.self_attn.v_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1814,value_states.17"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="2140" name="Constant_301748" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2141" name="__module.model.layers.8.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1822"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2142" name="__module.model.layers.8.self_attn/aten::transpose/ScatterElementsUpdate_2" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2143" name="__module.model.layers.8.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1823"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2144" name="__module.model.layers.8.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.8.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2145" name="__module.model.layers.8.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="1885,1886,1887"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2146" name="__module.model.layers.8.self_attn/aten::size/ShapeOf_10" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2147" name="Constant_302133" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2148" name="__module.model.layers.8.self_attn/aten::size/Constant_11" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="2149" name="__module.model.layers.8.self_attn/aten::size/Gather_11" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="1879"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2150" name="Constant_268140" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2151" name="Constant_276481" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2152" name="Constant_276482" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2153" name="Gather_276483" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2154" name="__module.model.layers.8.self_attn/prim::ListConstruct/Concat_5" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="1888"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="2155" name="__module.model.layers.8.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1889,hidden_states.255"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2156" name="Constant_301749" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2157" name="__module.model.layers.8.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1893"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2158" name="__module.model.layers.8.self_attn/aten::slice/Reshape_60" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2159" name="ShapeOf_298268" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2160" name="Constant_298269" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2161" name="Constant_298270" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2162" name="Gather_298271" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2163" name="ShapeOf_298272" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2164" name="Constant_298273" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2165" name="Constant_298274" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2166" name="Gather_298275" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2167" name="Add_298276" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="1894"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2168" name="__module.model.layers.8.self_attn/aten::slice/Reshape_62" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2169" name="__module.model.layers.8.self_attn/aten::slice/Reshape_63" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2170" name="__module.model.layers.8.self_attn/aten::slice/Slice_15" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="1898"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="2171" name="__module.model.layers.8.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="1899,attn_output.33"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2172" name="__module.model.layers.8.self_attn/aten::transpose/ScatterElementsUpdate_3" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2173" name="__module.model.layers.8.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1900"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2174" name="Constant_301750" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="798146608" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="2175" name="__module.model.layers.8.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1903"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2176" name="self.model.layers.8.self_attn.o_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="1942601848" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2177" name="Convert_386197" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2178" name="self.model.layers.8.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="1955709048" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2179" name="Convert_386199" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2180" name="self.model.layers.8.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2181" name="self.model.layers.8.self_attn.o_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="1955811448" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2182" name="self.model.layers.8.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2183" name="Constant_386204" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2184" name="Reshape_386205" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2185" name="__module.model.layers.8.self_attn.o_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2186" name="__module.model.layers.8.self_attn.o_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1905,1907,hidden_states.257"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2187" name="__module.model.layers.8/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1910,1912,1923,hidden_states.259,hidden_states.261"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2188" name="Constant_290137" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="1956221048" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2189" name="Constant_290136" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2190" name="Constant_290134" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2191" name="__module.model.layers.8.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1913"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2192" name="Constant_6500" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="1914"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2193" name="__module.model.layers.8.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1915,variance.35"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2194" name="Constant_290135" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2195" name="__module.model.layers.8.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1916"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2196" name="__module.model.layers.8.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2197" name="__module.model.layers.8.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1917"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2198" name="__module.model.layers.8.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1918,1919,hidden_states.263,hidden_states.265"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2199" name="__module.model.layers.8.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1920,1922"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2200" name="self.model.layers.8.mlp.gate_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="1956241528" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2201" name="Convert_384837" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2202" name="self.model.layers.8.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="1991630968" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2203" name="Convert_384839" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2204" name="self.model.layers.8.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2205" name="self.model.layers.8.mlp.gate_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="1991907448" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2206" name="self.model.layers.8.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2207" name="Constant_384844" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2208" name="Reshape_384845" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2209" name="__module.model.layers.8.mlp.gate_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2210" name="__module.model.layers.8.mlp.gate_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1928,input.17"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="2211" name="__module.model.layers.8.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="1929"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="2212" name="self.model.layers.8.mlp.up_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="1993013368" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2213" name="Convert_384827" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2214" name="self.model.layers.8.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="2028402808" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2215" name="Convert_384829" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2216" name="self.model.layers.8.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2217" name="self.model.layers.8.mlp.up_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="2028679288" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2218" name="self.model.layers.8.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2219" name="Constant_384834" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2220" name="Reshape_384835" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2221" name="__module.model.layers.8.mlp.up_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2222" name="__module.model.layers.8.mlp.up_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1931"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="2223" name="__module.model.layers.8.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1932"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="2224" name="self.model.layers.8.mlp.down_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 128" offset="2029785208" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2225" name="Convert_384847" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2226" name="self.model.layers.8.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 1" offset="2065174648" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2227" name="Convert_384849" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2228" name="self.model.layers.8.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2229" name="self.model.layers.8.mlp.down_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 108, 1" offset="2065451128" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2230" name="self.model.layers.8.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2231" name="Constant_384854" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="922101848" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2232" name="Reshape_384855" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="2233" name="__module.model.layers.8.mlp.down_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="2234" name="__module.model.layers.8.mlp.down_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1934,hidden_states.267"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2235" name="__module.model.layers.8/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1935,1937,1945,1956,hidden_states.269,hidden_states.271"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2236" name="Constant_290140" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2237" name="Constant_290138" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2238" name="__module.model.layers.9.input_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1946"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2239" name="Constant_6574" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="1947"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2240" name="__module.model.layers.9.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1948,variance.37"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2241" name="Constant_290139" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2242" name="__module.model.layers.9.input_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1949"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2243" name="__module.model.layers.9.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2244" name="__module.model.layers.9.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1950"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2245" name="__module.model.layers.9.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1951,1952,hidden_states.273,hidden_states.275"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2246" name="__module.model.layers.9.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1953,1955,hidden_states.277"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2247" name="self.model.layers.9.self_attn.v_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="2066557048" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2248" name="Convert_387167" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2249" name="self.model.layers.9.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="2069178488" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2250" name="Convert_387169" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2251" name="self.model.layers.9.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2252" name="self.model.layers.9.self_attn.v_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="2069198968" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2253" name="self.model.layers.9.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2254" name="Constant_387174" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2255" name="Reshape_387175" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2256" name="__module.model.layers.9.self_attn.v_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2257" name="__module.model.layers.9.self_attn.v_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="2258" name="self.model.layers.9.self_attn.v_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="2069280888" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.9.self_attn.v_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="2259" name="__module.model.layers.9.self_attn.v_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="2260" name="__module.model.layers.9.self_attn.v_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1971,value_states.19"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="2261" name="Constant_301754" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2262" name="__module.model.layers.9.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1979"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2263" name="__module.model.layers.9.self_attn/aten::transpose/ScatterElementsUpdate_2" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2264" name="__module.model.layers.9.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1980"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2265" name="__module.model.layers.9.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.9.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2267" name="Constant_341009" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="2268" name="Constant_341002" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2269" name="Constant_341004" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2270" name="Constant_341006" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2271" name="Concat_341007" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2272" name="Broadcast_341010" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2273" name="ReadValue_333264" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.9.keypresent.9.key" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.9.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2274" name="Constant_325363" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2275" name="Gather_325364" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2276" name="self.model.layers.9.self_attn.k_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="2069282936" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2277" name="Convert_387177" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2278" name="self.model.layers.9.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="2071904376" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2279" name="Convert_387179" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2280" name="self.model.layers.9.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2281" name="self.model.layers.9.self_attn.k_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="2071924856" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2282" name="self.model.layers.9.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2283" name="Constant_387184" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2284" name="Reshape_387185" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2285" name="__module.model.layers.9.self_attn.k_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2286" name="__module.model.layers.9.self_attn.k_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="2287" name="self.model.layers.9.self_attn.k_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="2072006776" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.9.self_attn.k_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="2288" name="__module.model.layers.9.self_attn.k_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="2289" name="__module.model.layers.9.self_attn.k_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1968,key_states.41"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="2290" name="Constant_301752" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2291" name="__module.model.layers.9.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1976"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2292" name="__module.model.layers.9.self_attn/aten::transpose/ScatterElementsUpdate_1" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2293" name="__module.model.layers.9.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1977,k.19"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2294" name="__module.model.layers.9.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1999"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2295" name="__module.model.layers.9.self_attn/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2296" name="__module.model.layers.9.self_attn/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="2297" name="__module.model.layers.9.self_attn/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="2000,2005" /> + </output> + </layer> + <layer id="2298" name="__module.model.layers.9.self_attn/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="2299" name="__module.model.layers.9.self_attn/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="2002,2003,2007,2008" /> + </output> + </layer> + <layer id="2300" name="Constant_220681" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2301" name="__module.model.layers.9.self_attn/aten::slice/Reshape_13" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2302" name="__module.model.layers.9.self_attn/aten::slice/Reshape_9" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2303" name="__module.model.layers.9.self_attn/aten::slice/Reshape_10" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2304" name="__module.model.layers.9.self_attn/aten::slice/Reshape_11" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2305" name="__module.model.layers.9.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="2009,x2.39"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2306" name="Constant_290143" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2307" name="__module.model.layers.9.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2010"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2308" name="__module.model.layers.9.self_attn/aten::slice/Reshape_12" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2309" name="__module.model.layers.9.self_attn/aten::slice/Reshape_14" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2310" name="__module.model.layers.9.self_attn/aten::slice/Reshape_15" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2311" name="__module.model.layers.9.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="2004"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2312" name="__module.model.layers.9.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2012"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2313" name="__module.model.layers.9.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2013"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2314" name="__module.model.layers.9.self_attn/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2014"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2315" name="__module.model.layers.9.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.9.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2325" name="Constant_341022" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="2326" name="Constant_341015" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2327" name="Constant_341017" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2328" name="Constant_341019" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2329" name="Concat_341020" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2330" name="Broadcast_341023" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2331" name="ReadValue_333246" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.47.valuepresent.47.value" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.47.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2332" name="Constant_325594" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2333" name="Gather_325595" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2334" name="Constant_290521" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="2072008824" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2335" name="self.model.layers.9.self_attn.q_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="2072029304" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2336" name="Convert_386207" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2337" name="self.model.layers.9.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="2085136504" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2338" name="Convert_386209" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2339" name="self.model.layers.9.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2340" name="self.model.layers.9.self_attn.q_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="2085238904" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2341" name="self.model.layers.9.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2342" name="Constant_386214" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2343" name="Reshape_386215" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2344" name="__module.model.layers.9.self_attn.q_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2345" name="__module.model.layers.9.self_attn.q_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2346" name="self.model.layers.9.self_attn.q_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="5120" offset="2085648504" size="10240" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.9.self_attn.q_proj.bias"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2347" name="__module.model.layers.9.self_attn.q_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2348" name="__module.model.layers.9.self_attn.q_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1965,query_states.19"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2349" name="Constant_301751" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="792694336" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2350" name="__module.model.layers.9.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1973"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2351" name="__module.model.layers.9.self_attn/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2352" name="__module.model.layers.9.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1974,q.19"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2353" name="__module.model.layers.9.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1983"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2354" name="__module.model.layers.9.self_attn/aten::size/ShapeOf_3" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2355" name="__module.model.layers.9.self_attn/aten::size/Constant_3" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="2356" name="__module.model.layers.9.self_attn/aten::size/Gather_3" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="1984,1989" /> + </output> + </layer> + <layer id="2357" name="__module.model.layers.9.self_attn/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="2358" name="__module.model.layers.9.self_attn/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="1986,1987,1991,1992" /> + </output> + </layer> + <layer id="2359" name="Constant_220680" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2360" name="__module.model.layers.9.self_attn/aten::slice/Reshape_5" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2361" name="__module.model.layers.9.self_attn/aten::slice/Reshape_1" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2362" name="__module.model.layers.9.self_attn/aten::slice/Reshape_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2363" name="__module.model.layers.9.self_attn/aten::slice/Reshape_3" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2364" name="__module.model.layers.9.self_attn/aten::slice/Slice" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="1993,x2.37"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2365" name="Constant_290142" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2366" name="__module.model.layers.9.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1994"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2367" name="__module.model.layers.9.self_attn/aten::slice/Reshape_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2368" name="__module.model.layers.9.self_attn/aten::slice/Reshape_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2369" name="__module.model.layers.9.self_attn/aten::slice/Reshape_7" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2370" name="__module.model.layers.9.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="1988"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2371" name="__module.model.layers.9.self_attn/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1996"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2372" name="__module.model.layers.9.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1997"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2373" name="__module.model.layers.9.self_attn/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="1998"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2374" name="__module.model.layers.9.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="2026,2027,2028"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2375" name="__module.model.layers.9.self_attn/aten::size/ShapeOf_6" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2376" name="Constant_302409" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="938477672" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2377" name="Constant_302410" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2378" name="Gather_302411" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2379" name="Constant_268158" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2380" name="Constant_276506" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2381" name="Constant_276507" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2382" name="Gather_276508" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2383" name="__module.model.layers.9.self_attn/prim::ListConstruct/Concat_2" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="3" precision="I64" names="2029"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="2384" name="__module.model.layers.9.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2030,hidden_states.281"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2385" name="Constant_301753" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2386" name="__module.model.layers.9.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2034,key_states.43"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2387" name="__module.model.layers.9.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="2042,2043,2044"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2388" name="__module.model.layers.9.self_attn/aten::size/ShapeOf_10" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2389" name="Constant_302139" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2390" name="__module.model.layers.9.self_attn/aten::size/Constant_11" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="2391" name="__module.model.layers.9.self_attn/aten::size/Gather_11" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="2036"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2392" name="Constant_268176" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2393" name="Constant_276516" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2394" name="Constant_276517" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2395" name="Gather_276518" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2396" name="__module.model.layers.9.self_attn/prim::ListConstruct/Concat_5" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="2045"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="2397" name="__module.model.layers.9.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2046,hidden_states.285"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2398" name="Constant_301755" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2399" name="__module.model.layers.9.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2050"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2400" name="__module.model.layers.9.self_attn/aten::slice/Reshape_60" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2401" name="ShapeOf_298354" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2402" name="Constant_298355" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2403" name="Constant_298356" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2404" name="Gather_298357" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2405" name="ShapeOf_298358" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2406" name="Constant_298359" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2407" name="Constant_298360" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2408" name="Gather_298361" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2409" name="Add_298362" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="2051"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2410" name="__module.model.layers.9.self_attn/aten::slice/Reshape_62" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2411" name="__module.model.layers.9.self_attn/aten::slice/Reshape_63" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2412" name="__module.model.layers.9.self_attn/aten::slice/Slice_15" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="2055"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="2413" name="__module.model.layers.9.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2056,attn_output.37"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2414" name="__module.model.layers.9.self_attn/aten::transpose/ScatterElementsUpdate_3" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2415" name="__module.model.layers.9.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2057"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2416" name="Constant_301756" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="798146608" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="2417" name="__module.model.layers.9.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2060"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2418" name="self.model.layers.9.self_attn.o_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="2085658744" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2419" name="Convert_386217" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2420" name="self.model.layers.9.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="2098765944" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2421" name="Convert_386219" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2422" name="self.model.layers.9.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2423" name="self.model.layers.9.self_attn.o_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="2098868344" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2424" name="self.model.layers.9.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2425" name="Constant_386224" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2426" name="Reshape_386225" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2427" name="__module.model.layers.9.self_attn.o_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2428" name="__module.model.layers.9.self_attn.o_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2062,2064,hidden_states.287"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2429" name="__module.model.layers.9/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2067,2069,2080,hidden_states.289,hidden_states.291"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2430" name="Constant_290147" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="2099277944" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2431" name="Constant_290146" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2432" name="Constant_290144" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2433" name="__module.model.layers.9.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2070"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2434" name="Constant_7172" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="2071"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2435" name="__module.model.layers.9.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2072,variance.39"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2436" name="Constant_290145" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2437" name="__module.model.layers.9.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2073"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2438" name="__module.model.layers.9.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2439" name="__module.model.layers.9.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2074"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2440" name="__module.model.layers.9.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2075,2076,hidden_states.293,hidden_states.295"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2441" name="__module.model.layers.9.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2077,2079"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2442" name="self.model.layers.9.mlp.gate_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="2099298424" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2443" name="Convert_384867" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2444" name="self.model.layers.9.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="2134687864" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2445" name="Convert_384869" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2446" name="self.model.layers.9.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2447" name="self.model.layers.9.mlp.gate_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="2134964344" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2448" name="self.model.layers.9.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2449" name="Constant_384874" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2450" name="Reshape_384875" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2451" name="__module.model.layers.9.mlp.gate_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2452" name="__module.model.layers.9.mlp.gate_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2085,input.19"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="2453" name="__module.model.layers.9.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="2086"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="2454" name="self.model.layers.9.mlp.up_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="2136070264" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2455" name="Convert_384857" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2456" name="self.model.layers.9.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="2171459704" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2457" name="Convert_384859" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2458" name="self.model.layers.9.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2459" name="self.model.layers.9.mlp.up_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="2171736184" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2460" name="self.model.layers.9.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2461" name="Constant_384864" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2462" name="Reshape_384865" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2463" name="__module.model.layers.9.mlp.up_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2464" name="__module.model.layers.9.mlp.up_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2088"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="2465" name="__module.model.layers.9.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2089"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="2466" name="self.model.layers.9.mlp.down_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 128" offset="2172842104" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2467" name="Convert_384877" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2468" name="self.model.layers.9.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 1" offset="2208231544" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2469" name="Convert_384879" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2470" name="self.model.layers.9.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2471" name="self.model.layers.9.mlp.down_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 108, 1" offset="2208508024" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2472" name="self.model.layers.9.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2473" name="Constant_384884" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="922101848" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2474" name="Reshape_384885" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="2475" name="__module.model.layers.9.mlp.down_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="2476" name="__module.model.layers.9.mlp.down_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2091,hidden_states.297"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2477" name="__module.model.layers.9/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2092,2094,2102,2113,hidden_states.299,hidden_states.301"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2478" name="Constant_290151" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="2209613944" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2479" name="Constant_290150" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2480" name="Constant_290148" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2481" name="__module.model.layers.10.input_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2103"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2482" name="Constant_7246" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="2104"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2483" name="__module.model.layers.10.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2105,variance.41"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2484" name="Constant_290149" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2485" name="__module.model.layers.10.input_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2106"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2486" name="__module.model.layers.10.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2487" name="__module.model.layers.10.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2107"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2488" name="__module.model.layers.10.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2108,2109,hidden_states.303,hidden_states.305"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2489" name="__module.model.layers.10.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2110,2112,hidden_states.307"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2490" name="self.model.layers.10.self_attn.q_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="2209634424" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2491" name="Convert_386227" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2492" name="self.model.layers.10.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="2222741624" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2493" name="Convert_386229" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2494" name="self.model.layers.10.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2495" name="self.model.layers.10.self_attn.q_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="2222844024" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2496" name="self.model.layers.10.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2497" name="Constant_386234" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2498" name="Reshape_386235" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2499" name="__module.model.layers.10.self_attn.q_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2500" name="__module.model.layers.10.self_attn.q_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2501" name="self.model.layers.10.self_attn.q_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="5120" offset="2223253624" size="10240" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.10.self_attn.q_proj.bias"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2502" name="__module.model.layers.10.self_attn.q_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2503" name="__module.model.layers.10.self_attn.q_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2122,query_states.21"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2504" name="Constant_301757" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="792694336" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2505" name="__module.model.layers.10.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2130"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2506" name="__module.model.layers.10.self_attn/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2507" name="__module.model.layers.10.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2131,q.21"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2508" name="__module.model.layers.10.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2140"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2509" name="__module.model.layers.10.self_attn/aten::size/ShapeOf_3" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2510" name="__module.model.layers.10.self_attn/aten::size/Constant_3" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="2511" name="__module.model.layers.10.self_attn/aten::size/Gather_3" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="2141,2146" /> + </output> + </layer> + <layer id="2512" name="__module.model.layers.10.self_attn/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="2513" name="__module.model.layers.10.self_attn/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="2143,2144,2148,2149" /> + </output> + </layer> + <layer id="2514" name="Constant_220695" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2515" name="__module.model.layers.10.self_attn/aten::slice/Reshape_5" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2516" name="__module.model.layers.10.self_attn/aten::slice/Reshape_1" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2517" name="__module.model.layers.10.self_attn/aten::slice/Reshape_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2518" name="__module.model.layers.10.self_attn/aten::slice/Reshape_3" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2519" name="__module.model.layers.10.self_attn/aten::slice/Slice" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="2150,x2.41"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2520" name="Constant_290152" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2521" name="__module.model.layers.10.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2151"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2522" name="__module.model.layers.10.self_attn/aten::slice/Reshape_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2523" name="__module.model.layers.10.self_attn/aten::slice/Reshape_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2524" name="__module.model.layers.10.self_attn/aten::slice/Reshape_7" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2525" name="__module.model.layers.10.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="2145"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2526" name="__module.model.layers.10.self_attn/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2153"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2527" name="__module.model.layers.10.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2154"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2528" name="__module.model.layers.10.self_attn/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2155"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2529" name="Constant_341035" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="2530" name="Constant_341028" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2531" name="Constant_341030" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2532" name="Constant_341032" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2533" name="Concat_341033" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2534" name="Broadcast_341036" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2535" name="ReadValue_333084" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.10.keypresent.10.key" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.10.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2536" name="Constant_325369" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2537" name="Gather_325370" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2538" name="self.model.layers.10.self_attn.k_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="2223263864" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2539" name="Convert_387187" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2540" name="self.model.layers.10.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="2225885304" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2541" name="Convert_387189" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2542" name="self.model.layers.10.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2543" name="self.model.layers.10.self_attn.k_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="2225905784" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2544" name="self.model.layers.10.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2545" name="Constant_387194" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2546" name="Reshape_387195" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2547" name="__module.model.layers.10.self_attn.k_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2548" name="__module.model.layers.10.self_attn.k_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="2549" name="self.model.layers.10.self_attn.k_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="2225987704" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.10.self_attn.k_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="2550" name="__module.model.layers.10.self_attn.k_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="2551" name="__module.model.layers.10.self_attn.k_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2125,key_states.45"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="2552" name="Constant_301758" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2553" name="__module.model.layers.10.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2133"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2554" name="__module.model.layers.10.self_attn/aten::transpose/ScatterElementsUpdate_1" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2555" name="__module.model.layers.10.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2134,k.21"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2556" name="__module.model.layers.10.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2156"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2557" name="__module.model.layers.10.self_attn/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2558" name="__module.model.layers.10.self_attn/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="2559" name="__module.model.layers.10.self_attn/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="2157,2162" /> + </output> + </layer> + <layer id="2560" name="__module.model.layers.10.self_attn/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="2561" name="__module.model.layers.10.self_attn/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="2159,2160,2164,2165" /> + </output> + </layer> + <layer id="2562" name="Constant_220696" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2563" name="__module.model.layers.10.self_attn/aten::slice/Reshape_13" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2564" name="__module.model.layers.10.self_attn/aten::slice/Reshape_9" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2565" name="__module.model.layers.10.self_attn/aten::slice/Reshape_10" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2566" name="__module.model.layers.10.self_attn/aten::slice/Reshape_11" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2567" name="__module.model.layers.10.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="2166,x2.43"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2568" name="Constant_290153" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2569" name="__module.model.layers.10.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2167"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2570" name="__module.model.layers.10.self_attn/aten::slice/Reshape_12" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2571" name="__module.model.layers.10.self_attn/aten::slice/Reshape_14" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2572" name="__module.model.layers.10.self_attn/aten::slice/Reshape_15" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2573" name="__module.model.layers.10.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="2161"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2574" name="__module.model.layers.10.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2169"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2575" name="__module.model.layers.10.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2170"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2576" name="__module.model.layers.10.self_attn/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2171"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2577" name="__module.model.layers.10.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.10.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2578" name="__module.model.layers.10.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="2183,2184,2185"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2579" name="__module.model.layers.10.self_attn/aten::size/ShapeOf_6" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2580" name="Constant_302414" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="938477672" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2581" name="Constant_302415" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2582" name="Gather_302416" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2583" name="Constant_268194" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2584" name="Constant_276541" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2585" name="Constant_276542" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2586" name="Gather_276543" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2587" name="__module.model.layers.10.self_attn/prim::ListConstruct/Concat_2" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="3" precision="I64" names="2186"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="2588" name="__module.model.layers.10.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2187,hidden_states.311"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2589" name="Constant_301759" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2590" name="__module.model.layers.10.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2191,key_states.47"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2591" name="Constant_341048" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="2592" name="Constant_341041" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2593" name="Constant_341043" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2594" name="Constant_341045" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2595" name="Concat_341046" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2596" name="Broadcast_341049" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2597" name="ReadValue_333086" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.10.valuepresent.10.value" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.10.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2598" name="Constant_325372" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2599" name="Gather_325373" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2600" name="self.model.layers.10.self_attn.v_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="2225989752" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2601" name="Convert_387197" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2602" name="self.model.layers.10.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="2228611192" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2603" name="Convert_387199" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2604" name="self.model.layers.10.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2605" name="self.model.layers.10.self_attn.v_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="2228631672" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2606" name="self.model.layers.10.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2607" name="Constant_387204" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2608" name="Reshape_387205" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2609" name="__module.model.layers.10.self_attn.v_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2610" name="__module.model.layers.10.self_attn.v_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="2611" name="self.model.layers.10.self_attn.v_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="2228713592" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.10.self_attn.v_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="2612" name="__module.model.layers.10.self_attn.v_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="2613" name="__module.model.layers.10.self_attn.v_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2128,value_states.21"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="2614" name="Constant_301760" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2615" name="__module.model.layers.10.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2136"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2616" name="__module.model.layers.10.self_attn/aten::transpose/ScatterElementsUpdate_2" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2617" name="__module.model.layers.10.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2137"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2618" name="__module.model.layers.10.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.10.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2619" name="__module.model.layers.10.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="2199,2200,2201"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2620" name="__module.model.layers.10.self_attn/aten::size/ShapeOf_10" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2621" name="Constant_302145" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2622" name="__module.model.layers.10.self_attn/aten::size/Constant_11" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="2623" name="__module.model.layers.10.self_attn/aten::size/Gather_11" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="2193"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2624" name="Constant_268212" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2625" name="Constant_276551" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2626" name="Constant_276552" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2627" name="Gather_276553" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2628" name="__module.model.layers.10.self_attn/prim::ListConstruct/Concat_5" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="2202"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="2629" name="__module.model.layers.10.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2203,hidden_states.315"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2630" name="Constant_301761" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2631" name="__module.model.layers.10.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2207"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2632" name="__module.model.layers.10.self_attn/aten::slice/Reshape_60" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2633" name="ShapeOf_298440" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2634" name="Constant_298441" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2635" name="Constant_298442" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2636" name="Gather_298443" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2637" name="ShapeOf_298444" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2638" name="Constant_298445" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2639" name="Constant_298446" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2640" name="Gather_298447" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2641" name="Add_298448" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="2208"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2642" name="__module.model.layers.10.self_attn/aten::slice/Reshape_62" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2643" name="__module.model.layers.10.self_attn/aten::slice/Reshape_63" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2644" name="__module.model.layers.10.self_attn/aten::slice/Slice_15" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="2212"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="2645" name="__module.model.layers.10.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2213,attn_output.41"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2646" name="__module.model.layers.10.self_attn/aten::transpose/ScatterElementsUpdate_3" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2647" name="__module.model.layers.10.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2214"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2648" name="Constant_301762" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="798146608" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="2649" name="__module.model.layers.10.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2217"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2650" name="self.model.layers.10.self_attn.o_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="2228715640" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2651" name="Convert_386237" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2652" name="self.model.layers.10.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="2241822840" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2653" name="Convert_386239" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2654" name="self.model.layers.10.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2655" name="self.model.layers.10.self_attn.o_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="2241925240" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2656" name="self.model.layers.10.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2657" name="Constant_386244" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2658" name="Reshape_386245" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2659" name="__module.model.layers.10.self_attn.o_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2660" name="__module.model.layers.10.self_attn.o_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2219,2221,hidden_states.317"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2661" name="__module.model.layers.10/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2224,2226,2237,hidden_states.319,hidden_states.321"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2662" name="Constant_290157" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="2242334840" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2663" name="Constant_290156" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2664" name="Constant_290154" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2665" name="__module.model.layers.10.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2227"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2666" name="Constant_7844" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="2228"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2667" name="__module.model.layers.10.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2229,variance.43"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2668" name="Constant_290155" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2669" name="__module.model.layers.10.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2230"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2670" name="__module.model.layers.10.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2671" name="__module.model.layers.10.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2231"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2672" name="__module.model.layers.10.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2232,2233,hidden_states.323,hidden_states.325"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2673" name="__module.model.layers.10.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2234,2236"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2674" name="self.model.layers.10.mlp.gate_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="2242355320" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2675" name="Convert_384897" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2676" name="self.model.layers.10.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="2277744760" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2677" name="Convert_384899" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2678" name="self.model.layers.10.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2679" name="self.model.layers.10.mlp.gate_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="2278021240" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2680" name="self.model.layers.10.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2681" name="Constant_384904" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2682" name="Reshape_384905" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2683" name="__module.model.layers.10.mlp.gate_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2684" name="__module.model.layers.10.mlp.gate_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2242,input.21"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="2685" name="__module.model.layers.10.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="2243"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="2686" name="self.model.layers.10.mlp.up_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="2279127160" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2687" name="Convert_384887" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2688" name="self.model.layers.10.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="2314516600" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2689" name="Convert_384889" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2690" name="self.model.layers.10.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2691" name="self.model.layers.10.mlp.up_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="2314793080" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2692" name="self.model.layers.10.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2693" name="Constant_384894" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2694" name="Reshape_384895" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2695" name="__module.model.layers.10.mlp.up_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2696" name="__module.model.layers.10.mlp.up_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2245"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="2697" name="__module.model.layers.10.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2246"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="2698" name="self.model.layers.10.mlp.down_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 128" offset="2315899000" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2699" name="Convert_384907" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2700" name="self.model.layers.10.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 1" offset="2351288440" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2701" name="Convert_384909" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2702" name="self.model.layers.10.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2703" name="self.model.layers.10.mlp.down_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 108, 1" offset="2351564920" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2704" name="self.model.layers.10.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2705" name="Constant_384914" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="922101848" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2706" name="Reshape_384915" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="2707" name="__module.model.layers.10.mlp.down_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="2708" name="__module.model.layers.10.mlp.down_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2248,hidden_states.327"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2709" name="__module.model.layers.10/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2249,2251,2259,2270,hidden_states.329,hidden_states.331"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2710" name="Constant_290161" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="2352670840" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2711" name="Constant_290160" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2712" name="Constant_290158" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2713" name="__module.model.layers.11.input_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2260"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2714" name="Constant_7918" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="2261"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2715" name="__module.model.layers.11.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2262,variance.45"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2716" name="Constant_290159" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2717" name="__module.model.layers.11.input_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2263"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2718" name="__module.model.layers.11.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2719" name="__module.model.layers.11.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2264"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2720" name="__module.model.layers.11.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2265,2266,hidden_states.333,hidden_states.335"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2721" name="__module.model.layers.11.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2267,2269,hidden_states.337"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2722" name="self.model.layers.11.self_attn.q_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="2352691320" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2723" name="Convert_386247" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2724" name="self.model.layers.11.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="2365798520" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2725" name="Convert_386249" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2726" name="self.model.layers.11.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2727" name="self.model.layers.11.self_attn.q_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="2365900920" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2728" name="self.model.layers.11.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2729" name="Constant_386254" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2730" name="Reshape_386255" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2731" name="__module.model.layers.11.self_attn.q_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2732" name="__module.model.layers.11.self_attn.q_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2733" name="self.model.layers.11.self_attn.q_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="5120" offset="2366310520" size="10240" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.11.self_attn.q_proj.bias"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2734" name="__module.model.layers.11.self_attn.q_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2735" name="__module.model.layers.11.self_attn.q_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2279,query_states.23"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2736" name="Constant_301763" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="792694336" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2737" name="__module.model.layers.11.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2287"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2738" name="__module.model.layers.11.self_attn/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2739" name="__module.model.layers.11.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2288,q.23"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2740" name="__module.model.layers.11.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2297"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2741" name="__module.model.layers.11.self_attn/aten::size/ShapeOf_3" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2742" name="__module.model.layers.11.self_attn/aten::size/Constant_3" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="2743" name="__module.model.layers.11.self_attn/aten::size/Gather_3" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="2298,2303" /> + </output> + </layer> + <layer id="2744" name="__module.model.layers.11.self_attn/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="2745" name="__module.model.layers.11.self_attn/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="2300,2301,2305,2306" /> + </output> + </layer> + <layer id="2746" name="Constant_220710" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2747" name="__module.model.layers.11.self_attn/aten::slice/Reshape_5" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2748" name="__module.model.layers.11.self_attn/aten::slice/Reshape_1" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2749" name="__module.model.layers.11.self_attn/aten::slice/Reshape_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2750" name="__module.model.layers.11.self_attn/aten::slice/Reshape_3" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2751" name="__module.model.layers.11.self_attn/aten::slice/Slice" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="2307,x2.45"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2752" name="Constant_290162" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2753" name="__module.model.layers.11.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2308"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2754" name="__module.model.layers.11.self_attn/aten::slice/Reshape_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2755" name="__module.model.layers.11.self_attn/aten::slice/Reshape_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2756" name="__module.model.layers.11.self_attn/aten::slice/Reshape_7" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2757" name="__module.model.layers.11.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="2302"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2758" name="__module.model.layers.11.self_attn/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2310"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2759" name="__module.model.layers.11.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2311"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2760" name="__module.model.layers.11.self_attn/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2312"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2761" name="Constant_341061" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="2762" name="Constant_341054" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2763" name="Constant_341056" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2764" name="Constant_341058" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2765" name="Concat_341059" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2766" name="Broadcast_341062" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2767" name="ReadValue_333088" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.11.keypresent.11.key" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.11.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2768" name="Constant_325375" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2769" name="Gather_325376" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2770" name="self.model.layers.11.self_attn.k_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="2366320760" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2771" name="Convert_387207" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2772" name="self.model.layers.11.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="2368942200" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2773" name="Convert_387209" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2774" name="self.model.layers.11.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2775" name="self.model.layers.11.self_attn.k_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="2368962680" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2776" name="self.model.layers.11.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2777" name="Constant_387214" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2778" name="Reshape_387215" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2779" name="__module.model.layers.11.self_attn.k_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2780" name="__module.model.layers.11.self_attn.k_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="2781" name="self.model.layers.11.self_attn.k_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="2369044600" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.11.self_attn.k_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="2782" name="__module.model.layers.11.self_attn.k_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="2783" name="__module.model.layers.11.self_attn.k_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2282,key_states.49"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="2784" name="Constant_301764" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2785" name="__module.model.layers.11.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2290"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2786" name="__module.model.layers.11.self_attn/aten::transpose/ScatterElementsUpdate_1" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2787" name="__module.model.layers.11.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2291,k.23"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2788" name="__module.model.layers.11.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2313"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2789" name="__module.model.layers.11.self_attn/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2790" name="__module.model.layers.11.self_attn/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="2791" name="__module.model.layers.11.self_attn/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="2314,2319" /> + </output> + </layer> + <layer id="2792" name="__module.model.layers.11.self_attn/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="2793" name="__module.model.layers.11.self_attn/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="2316,2317,2321,2322" /> + </output> + </layer> + <layer id="2794" name="Constant_220711" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2795" name="__module.model.layers.11.self_attn/aten::slice/Reshape_13" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2796" name="__module.model.layers.11.self_attn/aten::slice/Reshape_9" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2797" name="__module.model.layers.11.self_attn/aten::slice/Reshape_10" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2798" name="__module.model.layers.11.self_attn/aten::slice/Reshape_11" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2799" name="__module.model.layers.11.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="2323,x2.47"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2800" name="Constant_290163" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2801" name="__module.model.layers.11.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2324"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2802" name="__module.model.layers.11.self_attn/aten::slice/Reshape_12" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2803" name="__module.model.layers.11.self_attn/aten::slice/Reshape_14" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2804" name="__module.model.layers.11.self_attn/aten::slice/Reshape_15" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2805" name="__module.model.layers.11.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="2318"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2806" name="__module.model.layers.11.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2326"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2807" name="__module.model.layers.11.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2327"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2808" name="__module.model.layers.11.self_attn/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2328"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2809" name="__module.model.layers.11.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.11.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2810" name="__module.model.layers.11.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="2340,2341,2342"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2811" name="__module.model.layers.11.self_attn/aten::size/ShapeOf_6" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2812" name="Constant_302419" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="938477672" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2813" name="Constant_302420" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2814" name="Gather_302421" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2815" name="Constant_268230" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2816" name="Constant_276576" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2817" name="Constant_276577" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2818" name="Gather_276578" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2819" name="__module.model.layers.11.self_attn/prim::ListConstruct/Concat_2" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="3" precision="I64" names="2343"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="2820" name="__module.model.layers.11.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2344,hidden_states.341"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2821" name="Constant_301765" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2822" name="__module.model.layers.11.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2348,key_states.51"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2823" name="Constant_341074" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="2824" name="Constant_341067" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2825" name="Constant_341069" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2826" name="Constant_341071" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2827" name="Concat_341072" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2828" name="Broadcast_341075" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2829" name="ReadValue_333090" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.11.valuepresent.11.value" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.11.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2830" name="Constant_325378" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2831" name="Gather_325379" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2832" name="self.model.layers.11.self_attn.v_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="2369046648" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2833" name="Convert_387217" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2834" name="self.model.layers.11.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="2371668088" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2835" name="Convert_387219" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2836" name="self.model.layers.11.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2837" name="self.model.layers.11.self_attn.v_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="2371688568" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2838" name="self.model.layers.11.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2839" name="Constant_387224" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2840" name="Reshape_387225" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2841" name="__module.model.layers.11.self_attn.v_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2842" name="__module.model.layers.11.self_attn.v_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="2843" name="self.model.layers.11.self_attn.v_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="2371770488" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.11.self_attn.v_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="2844" name="__module.model.layers.11.self_attn.v_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="2845" name="__module.model.layers.11.self_attn.v_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2285,value_states.23"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="2846" name="Constant_301766" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2847" name="__module.model.layers.11.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2293"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2848" name="__module.model.layers.11.self_attn/aten::transpose/ScatterElementsUpdate_2" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2849" name="__module.model.layers.11.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2294"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2850" name="__module.model.layers.11.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.11.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2851" name="__module.model.layers.11.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="2356,2357,2358"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2852" name="__module.model.layers.11.self_attn/aten::size/ShapeOf_10" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2853" name="Constant_302151" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2854" name="__module.model.layers.11.self_attn/aten::size/Constant_11" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="2855" name="__module.model.layers.11.self_attn/aten::size/Gather_11" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="2350"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2856" name="Constant_268248" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2857" name="Constant_276586" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2858" name="Constant_276587" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2859" name="Gather_276588" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2860" name="__module.model.layers.11.self_attn/prim::ListConstruct/Concat_5" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="2359"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="2861" name="__module.model.layers.11.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2360,hidden_states.345"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2862" name="Constant_301767" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2863" name="__module.model.layers.11.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2364"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2864" name="__module.model.layers.11.self_attn/aten::slice/Reshape_60" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2865" name="ShapeOf_298526" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2866" name="Constant_298527" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2867" name="Constant_298528" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2868" name="Gather_298529" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2869" name="ShapeOf_298530" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2870" name="Constant_298531" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2871" name="Constant_298532" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="2872" name="Gather_298533" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2873" name="Add_298534" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="2365"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2874" name="__module.model.layers.11.self_attn/aten::slice/Reshape_62" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2875" name="__module.model.layers.11.self_attn/aten::slice/Reshape_63" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2876" name="__module.model.layers.11.self_attn/aten::slice/Slice_15" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="2369"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="2877" name="__module.model.layers.11.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2370,attn_output.45"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2878" name="__module.model.layers.11.self_attn/aten::transpose/ScatterElementsUpdate_3" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2879" name="__module.model.layers.11.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2371"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2880" name="Constant_301768" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="798146608" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="2881" name="__module.model.layers.11.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2374"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2882" name="self.model.layers.11.self_attn.o_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="2371772536" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2883" name="Convert_386257" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2884" name="self.model.layers.11.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="2384879736" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2885" name="Convert_386259" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2886" name="self.model.layers.11.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2887" name="self.model.layers.11.self_attn.o_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="2384982136" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2888" name="self.model.layers.11.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2889" name="Constant_386264" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2890" name="Reshape_386265" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2891" name="__module.model.layers.11.self_attn.o_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2892" name="__module.model.layers.11.self_attn.o_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2376,2378,hidden_states.347"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2893" name="__module.model.layers.11/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2381,2383,2394,hidden_states.349,hidden_states.351"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2894" name="Constant_290167" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="2385391736" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2895" name="Constant_290166" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2896" name="Constant_290164" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2897" name="__module.model.layers.11.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2384"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2898" name="Constant_8516" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="2385"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2899" name="__module.model.layers.11.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2386,variance.47"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2900" name="Constant_290165" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2901" name="__module.model.layers.11.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2387"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2902" name="__module.model.layers.11.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2903" name="__module.model.layers.11.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2388"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2904" name="__module.model.layers.11.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2389,2390,hidden_states.353,hidden_states.355"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2905" name="__module.model.layers.11.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2391,2393"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2906" name="self.model.layers.11.mlp.gate_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="2385412216" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2907" name="Convert_384927" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2908" name="self.model.layers.11.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="2420801656" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2909" name="Convert_384929" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2910" name="self.model.layers.11.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2911" name="self.model.layers.11.mlp.gate_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="2421078136" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2912" name="self.model.layers.11.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2913" name="Constant_384934" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2914" name="Reshape_384935" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2915" name="__module.model.layers.11.mlp.gate_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2916" name="__module.model.layers.11.mlp.gate_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2399,input.23"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="2917" name="__module.model.layers.11.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="2400"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="2918" name="self.model.layers.11.mlp.up_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="2422184056" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2919" name="Convert_384917" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2920" name="self.model.layers.11.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="2457573496" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2921" name="Convert_384919" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2922" name="self.model.layers.11.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2923" name="self.model.layers.11.mlp.up_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="2457849976" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2924" name="self.model.layers.11.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2925" name="Constant_384924" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2926" name="Reshape_384925" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2927" name="__module.model.layers.11.mlp.up_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2928" name="__module.model.layers.11.mlp.up_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2402"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="2929" name="__module.model.layers.11.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2403"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="2930" name="self.model.layers.11.mlp.down_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 128" offset="2458955896" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2931" name="Convert_384937" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2932" name="self.model.layers.11.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 1" offset="2494345336" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2933" name="Convert_384939" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2934" name="self.model.layers.11.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2935" name="self.model.layers.11.mlp.down_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 108, 1" offset="2494621816" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2936" name="self.model.layers.11.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2937" name="Constant_384944" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="922101848" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2938" name="Reshape_384945" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="2939" name="__module.model.layers.11.mlp.down_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="2940" name="__module.model.layers.11.mlp.down_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2405,hidden_states.357"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2941" name="__module.model.layers.11/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2406,2408,2416,2427,hidden_states.359,hidden_states.361"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2942" name="Constant_290171" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="2495727736" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2943" name="Constant_290170" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2944" name="Constant_290168" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2945" name="__module.model.layers.12.input_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2417"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2946" name="Constant_8590" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="2418"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2947" name="__module.model.layers.12.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2419,variance.49"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2948" name="Constant_290169" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2949" name="__module.model.layers.12.input_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2420"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2950" name="__module.model.layers.12.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2951" name="__module.model.layers.12.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2421"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2952" name="__module.model.layers.12.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2422,2423,hidden_states.363,hidden_states.365"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2953" name="__module.model.layers.12.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2424,2426,hidden_states.367"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2954" name="self.model.layers.12.self_attn.q_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="2495748216" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2955" name="Convert_386267" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2956" name="self.model.layers.12.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="2508855416" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2957" name="Convert_386269" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2958" name="self.model.layers.12.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2959" name="self.model.layers.12.self_attn.q_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="2508957816" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2960" name="self.model.layers.12.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2961" name="Constant_386274" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="2962" name="Reshape_386275" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2963" name="__module.model.layers.12.self_attn.q_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2964" name="__module.model.layers.12.self_attn.q_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2965" name="self.model.layers.12.self_attn.q_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="5120" offset="2509367416" size="10240" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.12.self_attn.q_proj.bias"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2966" name="__module.model.layers.12.self_attn.q_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2967" name="__module.model.layers.12.self_attn.q_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2436,query_states.25"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="2968" name="Constant_301769" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="792694336" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2969" name="__module.model.layers.12.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2444"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2970" name="__module.model.layers.12.self_attn/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2971" name="__module.model.layers.12.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2445,q.25"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2972" name="__module.model.layers.12.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2454"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2973" name="__module.model.layers.12.self_attn/aten::size/ShapeOf_3" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2974" name="__module.model.layers.12.self_attn/aten::size/Constant_3" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="2975" name="__module.model.layers.12.self_attn/aten::size/Gather_3" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="2455,2460" /> + </output> + </layer> + <layer id="2976" name="__module.model.layers.12.self_attn/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="2977" name="__module.model.layers.12.self_attn/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="2457,2458,2462,2463" /> + </output> + </layer> + <layer id="2978" name="Constant_220725" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2979" name="__module.model.layers.12.self_attn/aten::slice/Reshape_5" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2980" name="__module.model.layers.12.self_attn/aten::slice/Reshape_1" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2981" name="__module.model.layers.12.self_attn/aten::slice/Reshape_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2982" name="__module.model.layers.12.self_attn/aten::slice/Reshape_3" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2983" name="__module.model.layers.12.self_attn/aten::slice/Slice" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="2464,x2.49"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2984" name="Constant_290172" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2985" name="__module.model.layers.12.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2465"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2986" name="__module.model.layers.12.self_attn/aten::slice/Reshape_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2987" name="__module.model.layers.12.self_attn/aten::slice/Reshape_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2988" name="__module.model.layers.12.self_attn/aten::slice/Reshape_7" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2989" name="__module.model.layers.12.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="2459"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="2990" name="__module.model.layers.12.self_attn/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2467"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2991" name="__module.model.layers.12.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2468"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2992" name="__module.model.layers.12.self_attn/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2469"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2993" name="Constant_341087" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="2994" name="Constant_341080" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2995" name="Constant_341082" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2996" name="Constant_341084" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="2997" name="Concat_341085" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="2998" name="Broadcast_341088" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2999" name="ReadValue_333092" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.12.keypresent.12.key" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.12.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3000" name="Constant_325381" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3001" name="Gather_325382" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3002" name="self.model.layers.12.self_attn.k_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="2509377656" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3003" name="Convert_387227" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3004" name="self.model.layers.12.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="2511999096" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3005" name="Convert_387229" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3006" name="self.model.layers.12.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3007" name="self.model.layers.12.self_attn.k_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="2512019576" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3008" name="self.model.layers.12.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3009" name="Constant_387234" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3010" name="Reshape_387235" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3011" name="__module.model.layers.12.self_attn.k_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3012" name="__module.model.layers.12.self_attn.k_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="3013" name="self.model.layers.12.self_attn.k_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="2512101496" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.12.self_attn.k_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="3014" name="__module.model.layers.12.self_attn.k_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="3015" name="__module.model.layers.12.self_attn.k_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2439,key_states.53"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="3016" name="Constant_301770" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3017" name="__module.model.layers.12.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2447"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3018" name="__module.model.layers.12.self_attn/aten::transpose/ScatterElementsUpdate_1" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3019" name="__module.model.layers.12.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2448,k.25"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3020" name="__module.model.layers.12.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2470"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3021" name="__module.model.layers.12.self_attn/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3022" name="__module.model.layers.12.self_attn/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="3023" name="__module.model.layers.12.self_attn/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="2471,2476" /> + </output> + </layer> + <layer id="3024" name="__module.model.layers.12.self_attn/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="3025" name="__module.model.layers.12.self_attn/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="2473,2474,2478,2479" /> + </output> + </layer> + <layer id="3026" name="Constant_220726" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3027" name="__module.model.layers.12.self_attn/aten::slice/Reshape_13" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3028" name="__module.model.layers.12.self_attn/aten::slice/Reshape_9" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3029" name="__module.model.layers.12.self_attn/aten::slice/Reshape_10" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3030" name="__module.model.layers.12.self_attn/aten::slice/Reshape_11" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3031" name="__module.model.layers.12.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="2480,x2.51"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3032" name="Constant_290173" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3033" name="__module.model.layers.12.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2481"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3034" name="__module.model.layers.12.self_attn/aten::slice/Reshape_12" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3035" name="__module.model.layers.12.self_attn/aten::slice/Reshape_14" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3036" name="__module.model.layers.12.self_attn/aten::slice/Reshape_15" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3037" name="__module.model.layers.12.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="2475"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3038" name="__module.model.layers.12.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2483"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3039" name="__module.model.layers.12.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2484"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3040" name="__module.model.layers.12.self_attn/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2485"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3041" name="__module.model.layers.12.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.12.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3042" name="__module.model.layers.12.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="2497,2498,2499"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3043" name="__module.model.layers.12.self_attn/aten::size/ShapeOf_6" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3044" name="Constant_302424" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="938477672" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3045" name="Constant_302425" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3046" name="Gather_302426" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3047" name="Constant_268266" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3048" name="Constant_276611" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3049" name="Constant_276612" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3050" name="Gather_276613" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3051" name="__module.model.layers.12.self_attn/prim::ListConstruct/Concat_2" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="3" precision="I64" names="2500"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="3052" name="__module.model.layers.12.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2501,hidden_states.371"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3053" name="Constant_301771" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3054" name="__module.model.layers.12.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2505,key_states.55"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3055" name="Constant_341100" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="3056" name="Constant_341093" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3057" name="Constant_341095" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3058" name="Constant_341097" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3059" name="Concat_341098" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3060" name="Broadcast_341101" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3061" name="ReadValue_333094" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.12.valuepresent.12.value" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.12.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3062" name="Constant_325384" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3063" name="Gather_325385" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3064" name="self.model.layers.12.self_attn.v_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="2512103544" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3065" name="Convert_387237" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3066" name="self.model.layers.12.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="2514724984" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3067" name="Convert_387239" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3068" name="self.model.layers.12.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3069" name="self.model.layers.12.self_attn.v_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="2514745464" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3070" name="self.model.layers.12.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3071" name="Constant_387244" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3072" name="Reshape_387245" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3073" name="__module.model.layers.12.self_attn.v_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3074" name="__module.model.layers.12.self_attn.v_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="3075" name="self.model.layers.12.self_attn.v_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="2514827384" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.12.self_attn.v_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="3076" name="__module.model.layers.12.self_attn.v_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="3077" name="__module.model.layers.12.self_attn.v_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2442,value_states.25"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="3078" name="Constant_301772" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3079" name="__module.model.layers.12.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2450"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3080" name="__module.model.layers.12.self_attn/aten::transpose/ScatterElementsUpdate_2" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3081" name="__module.model.layers.12.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2451"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3082" name="__module.model.layers.12.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.12.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3083" name="__module.model.layers.12.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="2513,2514,2515"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3084" name="__module.model.layers.12.self_attn/aten::size/ShapeOf_10" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3085" name="Constant_302157" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3086" name="__module.model.layers.12.self_attn/aten::size/Constant_11" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="3087" name="__module.model.layers.12.self_attn/aten::size/Gather_11" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="2507"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3088" name="Constant_268284" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3089" name="Constant_276621" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3090" name="Constant_276622" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3091" name="Gather_276623" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3092" name="__module.model.layers.12.self_attn/prim::ListConstruct/Concat_5" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="2516"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="3093" name="__module.model.layers.12.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2517,hidden_states.375"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3094" name="Constant_301773" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3095" name="__module.model.layers.12.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2521"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3096" name="__module.model.layers.12.self_attn/aten::slice/Reshape_60" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3097" name="ShapeOf_298612" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3098" name="Constant_298613" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3099" name="Constant_298614" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3100" name="Gather_298615" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3101" name="ShapeOf_298616" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3102" name="Constant_298617" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3103" name="Constant_298618" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3104" name="Gather_298619" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3105" name="Add_298620" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="2522"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3106" name="__module.model.layers.12.self_attn/aten::slice/Reshape_62" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3107" name="__module.model.layers.12.self_attn/aten::slice/Reshape_63" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3108" name="__module.model.layers.12.self_attn/aten::slice/Slice_15" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="2526"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="3109" name="__module.model.layers.12.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2527,attn_output.49"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3110" name="__module.model.layers.12.self_attn/aten::transpose/ScatterElementsUpdate_3" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3111" name="__module.model.layers.12.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2528"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3112" name="Constant_301774" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="798146608" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="3113" name="__module.model.layers.12.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2531"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3114" name="self.model.layers.12.self_attn.o_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="2514829432" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3115" name="Convert_386277" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3116" name="self.model.layers.12.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="2527936632" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3117" name="Convert_386279" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3118" name="self.model.layers.12.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3119" name="self.model.layers.12.self_attn.o_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="2528039032" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3120" name="self.model.layers.12.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3121" name="Constant_386284" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3122" name="Reshape_386285" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3123" name="__module.model.layers.12.self_attn.o_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3124" name="__module.model.layers.12.self_attn.o_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2533,2535,hidden_states.377"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3125" name="__module.model.layers.12/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2538,2540,2551,hidden_states.379,hidden_states.381"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3126" name="Constant_290177" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="2528448632" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3127" name="Constant_290176" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3128" name="Constant_290174" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3129" name="__module.model.layers.12.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2541"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3130" name="Constant_9188" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="2542"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3131" name="__module.model.layers.12.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2543,variance.51"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3132" name="Constant_290175" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3133" name="__module.model.layers.12.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2544"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3134" name="__module.model.layers.12.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3135" name="__module.model.layers.12.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2545"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3136" name="__module.model.layers.12.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2546,2547,hidden_states.383,hidden_states.385"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3137" name="__module.model.layers.12.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2548,2550"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3138" name="self.model.layers.12.mlp.gate_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="2528469112" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3139" name="Convert_384957" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3140" name="self.model.layers.12.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="2563858552" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3141" name="Convert_384959" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3142" name="self.model.layers.12.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3143" name="self.model.layers.12.mlp.gate_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="2564135032" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3144" name="self.model.layers.12.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3145" name="Constant_384964" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3146" name="Reshape_384965" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3147" name="__module.model.layers.12.mlp.gate_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3148" name="__module.model.layers.12.mlp.gate_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2556,input.25"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="3149" name="__module.model.layers.12.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="2557"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="3150" name="self.model.layers.12.mlp.up_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="2565240952" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3151" name="Convert_384947" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3152" name="self.model.layers.12.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="2600630392" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3153" name="Convert_384949" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3154" name="self.model.layers.12.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3155" name="self.model.layers.12.mlp.up_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="2600906872" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3156" name="self.model.layers.12.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3157" name="Constant_384954" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3158" name="Reshape_384955" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3159" name="__module.model.layers.12.mlp.up_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3160" name="__module.model.layers.12.mlp.up_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2559"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="3161" name="__module.model.layers.12.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2560"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="3162" name="self.model.layers.12.mlp.down_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 128" offset="2602012792" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3163" name="Convert_384967" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3164" name="self.model.layers.12.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 1" offset="2637402232" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3165" name="Convert_384969" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3166" name="self.model.layers.12.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3167" name="self.model.layers.12.mlp.down_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 108, 1" offset="2637678712" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3168" name="self.model.layers.12.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3169" name="Constant_384974" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="922101848" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3170" name="Reshape_384975" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="3171" name="__module.model.layers.12.mlp.down_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="3172" name="__module.model.layers.12.mlp.down_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2562,hidden_states.387"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3173" name="__module.model.layers.12/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2563,2565,2573,2584,hidden_states.389,hidden_states.391"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3174" name="Constant_290181" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="2638784632" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3175" name="Constant_290180" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3176" name="Constant_290178" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3177" name="__module.model.layers.13.input_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2574"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3178" name="Constant_9262" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="2575"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3179" name="__module.model.layers.13.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2576,variance.53"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3180" name="Constant_290179" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3181" name="__module.model.layers.13.input_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2577"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3182" name="__module.model.layers.13.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3183" name="__module.model.layers.13.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2578"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3184" name="__module.model.layers.13.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2579,2580,hidden_states.393,hidden_states.395"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3185" name="__module.model.layers.13.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2581,2583,hidden_states.397"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3186" name="self.model.layers.13.self_attn.q_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="2638805112" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3187" name="Convert_386287" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3188" name="self.model.layers.13.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="2651912312" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3189" name="Convert_386289" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3190" name="self.model.layers.13.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3191" name="self.model.layers.13.self_attn.q_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="2652014712" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3192" name="self.model.layers.13.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3193" name="Constant_386294" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3194" name="Reshape_386295" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3195" name="__module.model.layers.13.self_attn.q_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3196" name="__module.model.layers.13.self_attn.q_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3197" name="self.model.layers.13.self_attn.q_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="5120" offset="2652424312" size="10240" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.13.self_attn.q_proj.bias"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3198" name="__module.model.layers.13.self_attn.q_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3199" name="__module.model.layers.13.self_attn.q_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2593,query_states.27"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3200" name="Constant_301775" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="792694336" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3201" name="__module.model.layers.13.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2601"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3202" name="__module.model.layers.13.self_attn/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3203" name="__module.model.layers.13.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2602,q.27"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3204" name="__module.model.layers.13.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2611"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3205" name="__module.model.layers.13.self_attn/aten::size/ShapeOf_3" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3206" name="__module.model.layers.13.self_attn/aten::size/Constant_3" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="3207" name="__module.model.layers.13.self_attn/aten::size/Gather_3" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="2612,2617" /> + </output> + </layer> + <layer id="3208" name="__module.model.layers.13.self_attn/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="3209" name="__module.model.layers.13.self_attn/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="2614,2615,2619,2620" /> + </output> + </layer> + <layer id="3210" name="Constant_220740" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3211" name="__module.model.layers.13.self_attn/aten::slice/Reshape_5" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3212" name="__module.model.layers.13.self_attn/aten::slice/Reshape_1" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3213" name="__module.model.layers.13.self_attn/aten::slice/Reshape_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3214" name="__module.model.layers.13.self_attn/aten::slice/Reshape_3" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3215" name="__module.model.layers.13.self_attn/aten::slice/Slice" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="2621,x2.53"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3216" name="Constant_290182" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3217" name="__module.model.layers.13.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2622"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3218" name="__module.model.layers.13.self_attn/aten::slice/Reshape_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3219" name="__module.model.layers.13.self_attn/aten::slice/Reshape_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3220" name="__module.model.layers.13.self_attn/aten::slice/Reshape_7" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3221" name="__module.model.layers.13.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="2616"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3222" name="__module.model.layers.13.self_attn/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2624"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3223" name="__module.model.layers.13.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2625"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3224" name="__module.model.layers.13.self_attn/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2626"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3225" name="Constant_341113" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="3226" name="Constant_341106" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3227" name="Constant_341108" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3228" name="Constant_341110" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3229" name="Concat_341111" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3230" name="Broadcast_341114" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3231" name="ReadValue_333096" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.13.keypresent.13.key" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.13.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3232" name="Constant_325387" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3233" name="Gather_325388" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3234" name="self.model.layers.13.self_attn.k_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="2652434552" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3235" name="Convert_387247" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3236" name="self.model.layers.13.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="2655055992" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3237" name="Convert_387249" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3238" name="self.model.layers.13.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3239" name="self.model.layers.13.self_attn.k_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="2655076472" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3240" name="self.model.layers.13.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3241" name="Constant_387254" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3242" name="Reshape_387255" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3243" name="__module.model.layers.13.self_attn.k_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3244" name="__module.model.layers.13.self_attn.k_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="3245" name="self.model.layers.13.self_attn.k_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="2655158392" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.13.self_attn.k_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="3246" name="__module.model.layers.13.self_attn.k_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="3247" name="__module.model.layers.13.self_attn.k_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2596,key_states.57"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="3248" name="Constant_301776" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3249" name="__module.model.layers.13.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2604"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3250" name="__module.model.layers.13.self_attn/aten::transpose/ScatterElementsUpdate_1" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3251" name="__module.model.layers.13.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2605,k.27"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3252" name="__module.model.layers.13.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2627"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3253" name="__module.model.layers.13.self_attn/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3254" name="__module.model.layers.13.self_attn/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="3255" name="__module.model.layers.13.self_attn/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="2628,2633" /> + </output> + </layer> + <layer id="3256" name="__module.model.layers.13.self_attn/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="3257" name="__module.model.layers.13.self_attn/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="2630,2631,2635,2636" /> + </output> + </layer> + <layer id="3258" name="Constant_220741" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3259" name="__module.model.layers.13.self_attn/aten::slice/Reshape_13" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3260" name="__module.model.layers.13.self_attn/aten::slice/Reshape_9" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3261" name="__module.model.layers.13.self_attn/aten::slice/Reshape_10" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3262" name="__module.model.layers.13.self_attn/aten::slice/Reshape_11" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3263" name="__module.model.layers.13.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="2637,x2.55"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3264" name="Constant_290183" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3265" name="__module.model.layers.13.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2638"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3266" name="__module.model.layers.13.self_attn/aten::slice/Reshape_12" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3267" name="__module.model.layers.13.self_attn/aten::slice/Reshape_14" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3268" name="__module.model.layers.13.self_attn/aten::slice/Reshape_15" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3269" name="__module.model.layers.13.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="2632"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3270" name="__module.model.layers.13.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2640"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3271" name="__module.model.layers.13.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2641"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3272" name="__module.model.layers.13.self_attn/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2642"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3273" name="__module.model.layers.13.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.13.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3274" name="__module.model.layers.13.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="2654,2655,2656"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3275" name="__module.model.layers.13.self_attn/aten::size/ShapeOf_6" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3276" name="Constant_302429" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="938477672" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3277" name="Constant_302430" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3278" name="Gather_302431" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3279" name="Constant_268302" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3280" name="Constant_276646" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3281" name="Constant_276647" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3282" name="Gather_276648" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3283" name="__module.model.layers.13.self_attn/prim::ListConstruct/Concat_2" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="3" precision="I64" names="2657"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="3284" name="__module.model.layers.13.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2658,hidden_states.401"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3285" name="Constant_301777" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3286" name="__module.model.layers.13.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2662,key_states.59"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3287" name="Constant_341126" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="3288" name="Constant_341119" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3289" name="Constant_341121" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3290" name="Constant_341123" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3291" name="Concat_341124" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3292" name="Broadcast_341127" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3293" name="ReadValue_333098" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.13.valuepresent.13.value" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.13.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3294" name="Constant_325390" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3295" name="Gather_325391" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3296" name="self.model.layers.13.self_attn.v_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="2655160440" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3297" name="Convert_387257" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3298" name="self.model.layers.13.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="2657781880" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3299" name="Convert_387259" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3300" name="self.model.layers.13.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3301" name="self.model.layers.13.self_attn.v_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="2657802360" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3302" name="self.model.layers.13.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3303" name="Constant_387264" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3304" name="Reshape_387265" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3305" name="__module.model.layers.13.self_attn.v_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3306" name="__module.model.layers.13.self_attn.v_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="3307" name="self.model.layers.13.self_attn.v_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="2657884280" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.13.self_attn.v_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="3308" name="__module.model.layers.13.self_attn.v_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="3309" name="__module.model.layers.13.self_attn.v_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2599,value_states.27"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="3310" name="Constant_301778" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3311" name="__module.model.layers.13.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2607"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3312" name="__module.model.layers.13.self_attn/aten::transpose/ScatterElementsUpdate_2" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3313" name="__module.model.layers.13.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2608"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3314" name="__module.model.layers.13.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.13.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3315" name="__module.model.layers.13.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="2670,2671,2672"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3316" name="__module.model.layers.13.self_attn/aten::size/ShapeOf_10" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3317" name="Constant_302163" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3318" name="__module.model.layers.13.self_attn/aten::size/Constant_11" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="3319" name="__module.model.layers.13.self_attn/aten::size/Gather_11" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="2664"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3320" name="Constant_268320" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3321" name="Constant_276656" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3322" name="Constant_276657" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3323" name="Gather_276658" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3324" name="__module.model.layers.13.self_attn/prim::ListConstruct/Concat_5" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="2673"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="3325" name="__module.model.layers.13.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2674,hidden_states.405"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3326" name="Constant_301779" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3327" name="__module.model.layers.13.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2678"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3328" name="__module.model.layers.13.self_attn/aten::slice/Reshape_60" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3329" name="ShapeOf_298698" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3330" name="Constant_298699" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3331" name="Constant_298700" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3332" name="Gather_298701" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3333" name="ShapeOf_298702" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3334" name="Constant_298703" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3335" name="Constant_298704" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3336" name="Gather_298705" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3337" name="Add_298706" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="2679"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3338" name="__module.model.layers.13.self_attn/aten::slice/Reshape_62" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3339" name="__module.model.layers.13.self_attn/aten::slice/Reshape_63" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3340" name="__module.model.layers.13.self_attn/aten::slice/Slice_15" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="2683"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="3341" name="__module.model.layers.13.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2684,attn_output.53"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3342" name="__module.model.layers.13.self_attn/aten::transpose/ScatterElementsUpdate_3" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3343" name="__module.model.layers.13.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2685"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3344" name="Constant_301780" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="798146608" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="3345" name="__module.model.layers.13.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2688"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3346" name="self.model.layers.13.self_attn.o_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="2657886328" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3347" name="Convert_386297" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3348" name="self.model.layers.13.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="2670993528" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3349" name="Convert_386299" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3350" name="self.model.layers.13.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3351" name="self.model.layers.13.self_attn.o_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="2671095928" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3352" name="self.model.layers.13.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3353" name="Constant_386304" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3354" name="Reshape_386305" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3355" name="__module.model.layers.13.self_attn.o_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3356" name="__module.model.layers.13.self_attn.o_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2690,2692,hidden_states.407"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3357" name="__module.model.layers.13/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2695,2697,2708,hidden_states.409,hidden_states.411"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3358" name="Constant_290187" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="2671505528" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3359" name="Constant_290186" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3360" name="Constant_290184" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3361" name="__module.model.layers.13.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2698"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3362" name="Constant_9860" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="2699"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3363" name="__module.model.layers.13.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2700,variance.55"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3364" name="Constant_290185" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3365" name="__module.model.layers.13.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2701"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3366" name="__module.model.layers.13.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3367" name="__module.model.layers.13.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2702"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3368" name="__module.model.layers.13.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2703,2704,hidden_states.413,hidden_states.415"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3369" name="__module.model.layers.13.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2705,2707"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3370" name="self.model.layers.13.mlp.gate_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="2671526008" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3371" name="Convert_384987" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3372" name="self.model.layers.13.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="2706915448" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3373" name="Convert_384989" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3374" name="self.model.layers.13.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3375" name="self.model.layers.13.mlp.gate_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="2707191928" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3376" name="self.model.layers.13.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3377" name="Constant_384994" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3378" name="Reshape_384995" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3379" name="__module.model.layers.13.mlp.gate_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3380" name="__module.model.layers.13.mlp.gate_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2713,input.27"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="3381" name="__module.model.layers.13.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="2714"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="3382" name="self.model.layers.13.mlp.up_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="2708297848" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3383" name="Convert_384977" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3384" name="self.model.layers.13.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="2743687288" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3385" name="Convert_384979" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3386" name="self.model.layers.13.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3387" name="self.model.layers.13.mlp.up_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="2743963768" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3388" name="self.model.layers.13.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3389" name="Constant_384984" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3390" name="Reshape_384985" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3391" name="__module.model.layers.13.mlp.up_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3392" name="__module.model.layers.13.mlp.up_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2716"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="3393" name="__module.model.layers.13.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2717"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="3394" name="self.model.layers.13.mlp.down_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 128" offset="2745069688" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3395" name="Convert_384997" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3396" name="self.model.layers.13.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 1" offset="2780459128" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3397" name="Convert_384999" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3398" name="self.model.layers.13.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3399" name="self.model.layers.13.mlp.down_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 108, 1" offset="2780735608" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3400" name="self.model.layers.13.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3401" name="Constant_385004" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="922101848" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3402" name="Reshape_385005" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="3403" name="__module.model.layers.13.mlp.down_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="3404" name="__module.model.layers.13.mlp.down_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2719,hidden_states.417"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3405" name="__module.model.layers.13/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2720,2722,2730,2741,hidden_states.419,hidden_states.421"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3406" name="Constant_290191" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="2781841528" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3407" name="Constant_290190" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3408" name="Constant_290188" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3409" name="__module.model.layers.14.input_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2731"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3410" name="Constant_9934" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="2732"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3411" name="__module.model.layers.14.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2733,variance.57"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3412" name="Constant_290189" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3413" name="__module.model.layers.14.input_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2734"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3414" name="__module.model.layers.14.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3415" name="__module.model.layers.14.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2735"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3416" name="__module.model.layers.14.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2736,2737,hidden_states.423,hidden_states.425"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3417" name="__module.model.layers.14.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2738,2740,hidden_states.427"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3418" name="self.model.layers.14.self_attn.q_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="2781862008" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3419" name="Convert_386307" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3420" name="self.model.layers.14.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="2794969208" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3421" name="Convert_386309" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3422" name="self.model.layers.14.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3423" name="self.model.layers.14.self_attn.q_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="2795071608" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3424" name="self.model.layers.14.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3425" name="Constant_386314" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3426" name="Reshape_386315" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3427" name="__module.model.layers.14.self_attn.q_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3428" name="__module.model.layers.14.self_attn.q_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3429" name="self.model.layers.14.self_attn.q_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="5120" offset="2795481208" size="10240" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.14.self_attn.q_proj.bias"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3430" name="__module.model.layers.14.self_attn.q_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3431" name="__module.model.layers.14.self_attn.q_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2750,query_states.29"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3432" name="Constant_301781" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="792694336" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3433" name="__module.model.layers.14.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2758"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3434" name="__module.model.layers.14.self_attn/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3435" name="__module.model.layers.14.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2759,q.29"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3436" name="__module.model.layers.14.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2768"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3437" name="__module.model.layers.14.self_attn/aten::size/ShapeOf_3" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3438" name="__module.model.layers.14.self_attn/aten::size/Constant_3" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="3439" name="__module.model.layers.14.self_attn/aten::size/Gather_3" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="2769,2774" /> + </output> + </layer> + <layer id="3440" name="__module.model.layers.14.self_attn/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="3441" name="__module.model.layers.14.self_attn/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="2771,2772,2776,2777" /> + </output> + </layer> + <layer id="3442" name="Constant_220755" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3443" name="__module.model.layers.14.self_attn/aten::slice/Reshape_5" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3444" name="__module.model.layers.14.self_attn/aten::slice/Reshape_1" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3445" name="__module.model.layers.14.self_attn/aten::slice/Reshape_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3446" name="__module.model.layers.14.self_attn/aten::slice/Reshape_3" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3447" name="__module.model.layers.14.self_attn/aten::slice/Slice" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="2778,x2.57"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3448" name="Constant_290192" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3449" name="__module.model.layers.14.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2779"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3450" name="__module.model.layers.14.self_attn/aten::slice/Reshape_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3451" name="__module.model.layers.14.self_attn/aten::slice/Reshape_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3452" name="__module.model.layers.14.self_attn/aten::slice/Reshape_7" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3453" name="__module.model.layers.14.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="2773"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3454" name="__module.model.layers.14.self_attn/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2781"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3455" name="__module.model.layers.14.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2782"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3456" name="__module.model.layers.14.self_attn/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2783"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3457" name="Constant_341139" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="3458" name="Constant_341132" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3459" name="Constant_341134" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3460" name="Constant_341136" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3461" name="Concat_341137" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3462" name="Broadcast_341140" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3463" name="ReadValue_333100" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.14.keypresent.14.key" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.14.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3464" name="Constant_325393" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3465" name="Gather_325394" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3466" name="self.model.layers.14.self_attn.k_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="2795491448" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3467" name="Convert_387267" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3468" name="self.model.layers.14.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="2798112888" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3469" name="Convert_387269" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3470" name="self.model.layers.14.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3471" name="self.model.layers.14.self_attn.k_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="2798133368" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3472" name="self.model.layers.14.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3473" name="Constant_387274" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3474" name="Reshape_387275" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3475" name="__module.model.layers.14.self_attn.k_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3476" name="__module.model.layers.14.self_attn.k_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="3477" name="self.model.layers.14.self_attn.k_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="2798215288" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.14.self_attn.k_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="3478" name="__module.model.layers.14.self_attn.k_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="3479" name="__module.model.layers.14.self_attn.k_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2753,key_states.61"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="3480" name="Constant_301782" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3481" name="__module.model.layers.14.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2761"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3482" name="__module.model.layers.14.self_attn/aten::transpose/ScatterElementsUpdate_1" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3483" name="__module.model.layers.14.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2762,k.29"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3484" name="__module.model.layers.14.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2784"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3485" name="__module.model.layers.14.self_attn/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3486" name="__module.model.layers.14.self_attn/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="3487" name="__module.model.layers.14.self_attn/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="2785,2790" /> + </output> + </layer> + <layer id="3488" name="__module.model.layers.14.self_attn/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="3489" name="__module.model.layers.14.self_attn/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="2787,2788,2792,2793" /> + </output> + </layer> + <layer id="3490" name="Constant_220756" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3491" name="__module.model.layers.14.self_attn/aten::slice/Reshape_13" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3492" name="__module.model.layers.14.self_attn/aten::slice/Reshape_9" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3493" name="__module.model.layers.14.self_attn/aten::slice/Reshape_10" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3494" name="__module.model.layers.14.self_attn/aten::slice/Reshape_11" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3495" name="__module.model.layers.14.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="2794,x2.59"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3496" name="Constant_290193" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3497" name="__module.model.layers.14.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2795"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3498" name="__module.model.layers.14.self_attn/aten::slice/Reshape_12" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3499" name="__module.model.layers.14.self_attn/aten::slice/Reshape_14" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3500" name="__module.model.layers.14.self_attn/aten::slice/Reshape_15" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3501" name="__module.model.layers.14.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="2789"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3502" name="__module.model.layers.14.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2797"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3503" name="__module.model.layers.14.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2798"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3504" name="__module.model.layers.14.self_attn/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2799"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3505" name="__module.model.layers.14.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.14.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3506" name="__module.model.layers.14.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="2811,2812,2813"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3507" name="__module.model.layers.14.self_attn/aten::size/ShapeOf_6" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3508" name="Constant_302434" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="938477672" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3509" name="Constant_302435" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3510" name="Gather_302436" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3511" name="Constant_268338" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3512" name="Constant_276681" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3513" name="Constant_276682" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3514" name="Gather_276683" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3515" name="__module.model.layers.14.self_attn/prim::ListConstruct/Concat_2" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="3" precision="I64" names="2814"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="3516" name="__module.model.layers.14.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2815,hidden_states.431"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3517" name="Constant_301783" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3518" name="__module.model.layers.14.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2819,key_states.63"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3519" name="Constant_341152" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="3520" name="Constant_341145" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3521" name="Constant_341147" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3522" name="Constant_341149" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3523" name="Concat_341150" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3524" name="Broadcast_341153" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3525" name="ReadValue_333102" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.14.valuepresent.14.value" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.14.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3526" name="Constant_325396" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3527" name="Gather_325397" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3528" name="self.model.layers.14.self_attn.v_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="2798217336" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3529" name="Convert_387277" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3530" name="self.model.layers.14.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="2800838776" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3531" name="Convert_387279" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3532" name="self.model.layers.14.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3533" name="self.model.layers.14.self_attn.v_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="2800859256" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3534" name="self.model.layers.14.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3535" name="Constant_387284" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3536" name="Reshape_387285" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3537" name="__module.model.layers.14.self_attn.v_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3538" name="__module.model.layers.14.self_attn.v_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="3539" name="self.model.layers.14.self_attn.v_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="2800941176" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.14.self_attn.v_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="3540" name="__module.model.layers.14.self_attn.v_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="3541" name="__module.model.layers.14.self_attn.v_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2756,value_states.29"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="3542" name="Constant_301784" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3543" name="__module.model.layers.14.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2764"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3544" name="__module.model.layers.14.self_attn/aten::transpose/ScatterElementsUpdate_2" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3545" name="__module.model.layers.14.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2765"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3546" name="__module.model.layers.14.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.14.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3547" name="__module.model.layers.14.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="2827,2828,2829"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3548" name="__module.model.layers.14.self_attn/aten::size/ShapeOf_10" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3549" name="Constant_302169" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3550" name="__module.model.layers.14.self_attn/aten::size/Constant_11" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="3551" name="__module.model.layers.14.self_attn/aten::size/Gather_11" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="2821"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3552" name="Constant_268356" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3553" name="Constant_276691" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3554" name="Constant_276692" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3555" name="Gather_276693" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3556" name="__module.model.layers.14.self_attn/prim::ListConstruct/Concat_5" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="2830"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="3557" name="__module.model.layers.14.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2831,hidden_states.435"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3558" name="Constant_301785" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3559" name="__module.model.layers.14.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2835"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3560" name="__module.model.layers.14.self_attn/aten::slice/Reshape_60" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3561" name="ShapeOf_298784" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3562" name="Constant_298785" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3563" name="Constant_298786" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3564" name="Gather_298787" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3565" name="ShapeOf_298788" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3566" name="Constant_298789" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3567" name="Constant_298790" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3568" name="Gather_298791" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3569" name="Add_298792" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="2836"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3570" name="__module.model.layers.14.self_attn/aten::slice/Reshape_62" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3571" name="__module.model.layers.14.self_attn/aten::slice/Reshape_63" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3572" name="__module.model.layers.14.self_attn/aten::slice/Slice_15" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="2840"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="3573" name="__module.model.layers.14.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2841,attn_output.57"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3574" name="__module.model.layers.14.self_attn/aten::transpose/ScatterElementsUpdate_3" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3575" name="__module.model.layers.14.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2842"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3576" name="Constant_301786" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="798146608" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="3577" name="__module.model.layers.14.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2845"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3578" name="self.model.layers.14.self_attn.o_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="2800943224" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3579" name="Convert_386317" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3580" name="self.model.layers.14.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="2814050424" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3581" name="Convert_386319" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3582" name="self.model.layers.14.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3583" name="self.model.layers.14.self_attn.o_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="2814152824" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3584" name="self.model.layers.14.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3585" name="Constant_386324" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3586" name="Reshape_386325" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3587" name="__module.model.layers.14.self_attn.o_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3588" name="__module.model.layers.14.self_attn.o_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2847,2849,hidden_states.437"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3589" name="__module.model.layers.14/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2852,2854,2865,hidden_states.439,hidden_states.441"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3590" name="Constant_290197" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="2814562424" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3591" name="Constant_290196" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3592" name="Constant_290194" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3593" name="__module.model.layers.14.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2855"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3594" name="Constant_10532" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="2856"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3595" name="__module.model.layers.14.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2857,variance.59"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3596" name="Constant_290195" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3597" name="__module.model.layers.14.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2858"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3598" name="__module.model.layers.14.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3599" name="__module.model.layers.14.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2859"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3600" name="__module.model.layers.14.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2860,2861,hidden_states.443,hidden_states.445"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3601" name="__module.model.layers.14.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2862,2864"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3602" name="self.model.layers.14.mlp.gate_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="2814582904" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3603" name="Convert_385017" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3604" name="self.model.layers.14.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="2849972344" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3605" name="Convert_385019" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3606" name="self.model.layers.14.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3607" name="self.model.layers.14.mlp.gate_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="2850248824" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3608" name="self.model.layers.14.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3609" name="Constant_385024" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3610" name="Reshape_385025" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3611" name="__module.model.layers.14.mlp.gate_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3612" name="__module.model.layers.14.mlp.gate_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2870,input.29"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="3613" name="__module.model.layers.14.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="2871"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="3614" name="self.model.layers.14.mlp.up_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="2851354744" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3615" name="Convert_385007" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3616" name="self.model.layers.14.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="2886744184" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3617" name="Convert_385009" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3618" name="self.model.layers.14.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3619" name="self.model.layers.14.mlp.up_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="2887020664" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3620" name="self.model.layers.14.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3621" name="Constant_385014" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3622" name="Reshape_385015" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3623" name="__module.model.layers.14.mlp.up_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3624" name="__module.model.layers.14.mlp.up_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2873"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="3625" name="__module.model.layers.14.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2874"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="3626" name="self.model.layers.14.mlp.down_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 128" offset="2888126584" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3627" name="Convert_385027" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3628" name="self.model.layers.14.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 1" offset="2923516024" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3629" name="Convert_385029" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3630" name="self.model.layers.14.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3631" name="self.model.layers.14.mlp.down_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 108, 1" offset="2923792504" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3632" name="self.model.layers.14.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3633" name="Constant_385034" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="922101848" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3634" name="Reshape_385035" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="3635" name="__module.model.layers.14.mlp.down_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="3636" name="__module.model.layers.14.mlp.down_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2876,hidden_states.447"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3637" name="__module.model.layers.14/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2877,2879,2887,2898,hidden_states.449,hidden_states.451"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3638" name="Constant_290201" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="2924898424" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3639" name="Constant_290200" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3640" name="Constant_290198" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3641" name="__module.model.layers.15.input_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2888"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3642" name="Constant_10606" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="2889"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3643" name="__module.model.layers.15.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2890,variance.61"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3644" name="Constant_290199" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3645" name="__module.model.layers.15.input_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2891"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3646" name="__module.model.layers.15.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3647" name="__module.model.layers.15.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2892"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3648" name="__module.model.layers.15.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2893,2894,hidden_states.453,hidden_states.455"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3649" name="__module.model.layers.15.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2895,2897,hidden_states.457"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3650" name="self.model.layers.15.self_attn.q_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="2924918904" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3651" name="Convert_386327" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3652" name="self.model.layers.15.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="2938026104" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3653" name="Convert_386329" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3654" name="self.model.layers.15.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3655" name="self.model.layers.15.self_attn.q_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="2938128504" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3656" name="self.model.layers.15.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3657" name="Constant_386334" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3658" name="Reshape_386335" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3659" name="__module.model.layers.15.self_attn.q_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3660" name="__module.model.layers.15.self_attn.q_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3661" name="self.model.layers.15.self_attn.q_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="5120" offset="2938538104" size="10240" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.15.self_attn.q_proj.bias"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3662" name="__module.model.layers.15.self_attn.q_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3663" name="__module.model.layers.15.self_attn.q_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2907,query_states.31"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3664" name="Constant_301787" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="792694336" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3665" name="__module.model.layers.15.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2915"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3666" name="__module.model.layers.15.self_attn/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3667" name="__module.model.layers.15.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2916,q.31"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3668" name="__module.model.layers.15.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2925"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3669" name="__module.model.layers.15.self_attn/aten::size/ShapeOf_3" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3670" name="__module.model.layers.15.self_attn/aten::size/Constant_3" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="3671" name="__module.model.layers.15.self_attn/aten::size/Gather_3" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="2926,2931" /> + </output> + </layer> + <layer id="3672" name="__module.model.layers.15.self_attn/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="3673" name="__module.model.layers.15.self_attn/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="2928,2929,2933,2934" /> + </output> + </layer> + <layer id="3674" name="Constant_220770" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3675" name="__module.model.layers.15.self_attn/aten::slice/Reshape_5" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3676" name="__module.model.layers.15.self_attn/aten::slice/Reshape_1" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3677" name="__module.model.layers.15.self_attn/aten::slice/Reshape_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3678" name="__module.model.layers.15.self_attn/aten::slice/Reshape_3" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3679" name="__module.model.layers.15.self_attn/aten::slice/Slice" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="2935,x2.61"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3680" name="Constant_290202" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3681" name="__module.model.layers.15.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2936"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3682" name="__module.model.layers.15.self_attn/aten::slice/Reshape_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3683" name="__module.model.layers.15.self_attn/aten::slice/Reshape_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3684" name="__module.model.layers.15.self_attn/aten::slice/Reshape_7" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3685" name="__module.model.layers.15.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="2930"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3686" name="__module.model.layers.15.self_attn/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2938"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3687" name="__module.model.layers.15.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2939"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3688" name="__module.model.layers.15.self_attn/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2940"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3689" name="Constant_341165" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="3690" name="Constant_341158" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3691" name="Constant_341160" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3692" name="Constant_341162" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3693" name="Concat_341163" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3694" name="Broadcast_341166" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3695" name="ReadValue_333104" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.15.keypresent.15.key" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.15.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3696" name="Constant_325399" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3697" name="Gather_325400" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3698" name="self.model.layers.15.self_attn.k_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="2938548344" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3699" name="Convert_387287" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3700" name="self.model.layers.15.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="2941169784" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3701" name="Convert_387289" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3702" name="self.model.layers.15.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3703" name="self.model.layers.15.self_attn.k_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="2941190264" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3704" name="self.model.layers.15.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3705" name="Constant_387294" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3706" name="Reshape_387295" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3707" name="__module.model.layers.15.self_attn.k_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3708" name="__module.model.layers.15.self_attn.k_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="3709" name="self.model.layers.15.self_attn.k_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="2941272184" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.15.self_attn.k_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="3710" name="__module.model.layers.15.self_attn.k_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="3711" name="__module.model.layers.15.self_attn.k_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2910,key_states.65"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="3712" name="Constant_301788" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3713" name="__module.model.layers.15.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2918"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3714" name="__module.model.layers.15.self_attn/aten::transpose/ScatterElementsUpdate_1" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3715" name="__module.model.layers.15.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2919,k.31"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3716" name="__module.model.layers.15.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2941"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3717" name="__module.model.layers.15.self_attn/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3718" name="__module.model.layers.15.self_attn/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="3719" name="__module.model.layers.15.self_attn/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="2942,2947" /> + </output> + </layer> + <layer id="3720" name="__module.model.layers.15.self_attn/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="3721" name="__module.model.layers.15.self_attn/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="2944,2945,2949,2950" /> + </output> + </layer> + <layer id="3722" name="Constant_220771" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3723" name="__module.model.layers.15.self_attn/aten::slice/Reshape_13" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3724" name="__module.model.layers.15.self_attn/aten::slice/Reshape_9" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3725" name="__module.model.layers.15.self_attn/aten::slice/Reshape_10" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3726" name="__module.model.layers.15.self_attn/aten::slice/Reshape_11" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3727" name="__module.model.layers.15.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="2951,x2.63"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3728" name="Constant_290203" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3729" name="__module.model.layers.15.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2952"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3730" name="__module.model.layers.15.self_attn/aten::slice/Reshape_12" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3731" name="__module.model.layers.15.self_attn/aten::slice/Reshape_14" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3732" name="__module.model.layers.15.self_attn/aten::slice/Reshape_15" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3733" name="__module.model.layers.15.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="2946"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3734" name="__module.model.layers.15.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2954"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3735" name="__module.model.layers.15.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2955"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3736" name="__module.model.layers.15.self_attn/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2956"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3737" name="__module.model.layers.15.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.15.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3738" name="__module.model.layers.15.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="2968,2969,2970"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3739" name="__module.model.layers.15.self_attn/aten::size/ShapeOf_6" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3740" name="Constant_302439" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="938477672" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3741" name="Constant_302440" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3742" name="Gather_302441" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3743" name="Constant_268374" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3744" name="Constant_276716" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3745" name="Constant_276717" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3746" name="Gather_276718" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3747" name="__module.model.layers.15.self_attn/prim::ListConstruct/Concat_2" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="3" precision="I64" names="2971"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="3748" name="__module.model.layers.15.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2972,hidden_states.461"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3749" name="Constant_301789" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3750" name="__module.model.layers.15.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2976,key_states.67"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3751" name="Constant_341178" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="3752" name="Constant_341171" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3753" name="Constant_341173" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3754" name="Constant_341175" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3755" name="Concat_341176" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3756" name="Broadcast_341179" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3757" name="ReadValue_333106" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.15.valuepresent.15.value" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.15.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3758" name="Constant_325402" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3759" name="Gather_325403" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3760" name="self.model.layers.15.self_attn.v_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="2941274232" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3761" name="Convert_387297" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3762" name="self.model.layers.15.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="2943895672" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3763" name="Convert_387299" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3764" name="self.model.layers.15.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3765" name="self.model.layers.15.self_attn.v_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="2943916152" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3766" name="self.model.layers.15.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3767" name="Constant_387304" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3768" name="Reshape_387305" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3769" name="__module.model.layers.15.self_attn.v_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3770" name="__module.model.layers.15.self_attn.v_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="3771" name="self.model.layers.15.self_attn.v_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="2943998072" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.15.self_attn.v_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="3772" name="__module.model.layers.15.self_attn.v_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="3773" name="__module.model.layers.15.self_attn.v_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2913,value_states.31"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="3774" name="Constant_301790" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3775" name="__module.model.layers.15.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2921"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3776" name="__module.model.layers.15.self_attn/aten::transpose/ScatterElementsUpdate_2" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3777" name="__module.model.layers.15.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2922"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3778" name="__module.model.layers.15.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.15.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3779" name="__module.model.layers.15.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="2984,2985,2986"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3780" name="__module.model.layers.15.self_attn/aten::size/ShapeOf_10" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3781" name="Constant_302175" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3782" name="__module.model.layers.15.self_attn/aten::size/Constant_11" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="3783" name="__module.model.layers.15.self_attn/aten::size/Gather_11" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="2978"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3784" name="Constant_268392" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3785" name="Constant_276726" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3786" name="Constant_276727" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3787" name="Gather_276728" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3788" name="__module.model.layers.15.self_attn/prim::ListConstruct/Concat_5" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="2987"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="3789" name="__module.model.layers.15.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2988,hidden_states.465"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3790" name="Constant_301791" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3791" name="__module.model.layers.15.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2992"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3792" name="__module.model.layers.15.self_attn/aten::slice/Reshape_60" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3793" name="ShapeOf_298870" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3794" name="Constant_298871" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3795" name="Constant_298872" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3796" name="Gather_298873" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3797" name="ShapeOf_298874" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3798" name="Constant_298875" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3799" name="Constant_298876" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3800" name="Gather_298877" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3801" name="Add_298878" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="2993"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3802" name="__module.model.layers.15.self_attn/aten::slice/Reshape_62" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3803" name="__module.model.layers.15.self_attn/aten::slice/Reshape_63" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3804" name="__module.model.layers.15.self_attn/aten::slice/Slice_15" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="2997"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="3805" name="__module.model.layers.15.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="2998,attn_output.61"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3806" name="__module.model.layers.15.self_attn/aten::transpose/ScatterElementsUpdate_3" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3807" name="__module.model.layers.15.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="2999"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3808" name="Constant_301792" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="798146608" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="3809" name="__module.model.layers.15.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3002"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3810" name="self.model.layers.15.self_attn.o_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="2944000120" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3811" name="Convert_386337" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3812" name="self.model.layers.15.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="2957107320" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3813" name="Convert_386339" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3814" name="self.model.layers.15.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3815" name="self.model.layers.15.self_attn.o_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="2957209720" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3816" name="self.model.layers.15.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3817" name="Constant_386344" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3818" name="Reshape_386345" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3819" name="__module.model.layers.15.self_attn.o_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3820" name="__module.model.layers.15.self_attn.o_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3004,3006,hidden_states.467"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3821" name="__module.model.layers.15/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3009,3011,3022,hidden_states.469,hidden_states.471"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3822" name="Constant_290207" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="2957619320" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3823" name="Constant_290206" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3824" name="Constant_290204" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3825" name="__module.model.layers.15.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3012"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3826" name="Constant_11204" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="3013"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3827" name="__module.model.layers.15.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3014,variance.63"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3828" name="Constant_290205" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3829" name="__module.model.layers.15.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3015"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3830" name="__module.model.layers.15.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3831" name="__module.model.layers.15.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3016"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3832" name="__module.model.layers.15.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3017,3018,hidden_states.473,hidden_states.475"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3833" name="__module.model.layers.15.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3019,3021"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3834" name="self.model.layers.15.mlp.gate_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="2957639800" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3835" name="Convert_385047" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3836" name="self.model.layers.15.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="2993029240" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3837" name="Convert_385049" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3838" name="self.model.layers.15.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3839" name="self.model.layers.15.mlp.gate_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="2993305720" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3840" name="self.model.layers.15.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3841" name="Constant_385054" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3842" name="Reshape_385055" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3843" name="__module.model.layers.15.mlp.gate_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3844" name="__module.model.layers.15.mlp.gate_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3027,input.31"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="3845" name="__module.model.layers.15.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="3028"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="3846" name="self.model.layers.15.mlp.up_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="2994411640" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3847" name="Convert_385037" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3848" name="self.model.layers.15.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="3029801080" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3849" name="Convert_385039" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3850" name="self.model.layers.15.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3851" name="self.model.layers.15.mlp.up_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="3030077560" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3852" name="self.model.layers.15.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3853" name="Constant_385044" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3854" name="Reshape_385045" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3855" name="__module.model.layers.15.mlp.up_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3856" name="__module.model.layers.15.mlp.up_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3030"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="3857" name="__module.model.layers.15.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3031"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="3858" name="self.model.layers.15.mlp.down_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 128" offset="3031183480" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3859" name="Convert_385057" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3860" name="self.model.layers.15.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 1" offset="3066572920" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3861" name="Convert_385059" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3862" name="self.model.layers.15.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3863" name="self.model.layers.15.mlp.down_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 108, 1" offset="3066849400" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3864" name="self.model.layers.15.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3865" name="Constant_385064" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="922101848" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3866" name="Reshape_385065" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="3867" name="__module.model.layers.15.mlp.down_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="3868" name="__module.model.layers.15.mlp.down_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3033,hidden_states.477"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3869" name="__module.model.layers.15/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3034,3036,3044,3055,hidden_states.479,hidden_states.481"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3870" name="Constant_290211" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="3067955320" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3871" name="Constant_290210" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3872" name="Constant_290208" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3873" name="__module.model.layers.16.input_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3045"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3874" name="Constant_11278" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="3046"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3875" name="__module.model.layers.16.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3047,variance.65"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3876" name="Constant_290209" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3877" name="__module.model.layers.16.input_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3048"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3878" name="__module.model.layers.16.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3879" name="__module.model.layers.16.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3049"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3880" name="__module.model.layers.16.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3050,3051,hidden_states.483,hidden_states.485"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3881" name="__module.model.layers.16.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3052,3054,hidden_states.487"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3882" name="self.model.layers.16.self_attn.q_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="3067975800" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3883" name="Convert_386347" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3884" name="self.model.layers.16.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="3081083000" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3885" name="Convert_386349" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3886" name="self.model.layers.16.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3887" name="self.model.layers.16.self_attn.q_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="3081185400" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3888" name="self.model.layers.16.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3889" name="Constant_386354" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3890" name="Reshape_386355" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3891" name="__module.model.layers.16.self_attn.q_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3892" name="__module.model.layers.16.self_attn.q_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3893" name="self.model.layers.16.self_attn.q_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="5120" offset="3081595000" size="10240" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.16.self_attn.q_proj.bias"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3894" name="__module.model.layers.16.self_attn.q_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3895" name="__module.model.layers.16.self_attn.q_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3064,query_states.33"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3896" name="Constant_301793" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="792694336" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3897" name="__module.model.layers.16.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3072"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3898" name="__module.model.layers.16.self_attn/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3899" name="__module.model.layers.16.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3073,q.33"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3900" name="__module.model.layers.16.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3082"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3901" name="__module.model.layers.16.self_attn/aten::size/ShapeOf_3" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3902" name="__module.model.layers.16.self_attn/aten::size/Constant_3" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="3903" name="__module.model.layers.16.self_attn/aten::size/Gather_3" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="3083,3088" /> + </output> + </layer> + <layer id="3904" name="__module.model.layers.16.self_attn/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="3905" name="__module.model.layers.16.self_attn/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="3085,3086,3090,3091" /> + </output> + </layer> + <layer id="3906" name="Constant_220785" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3907" name="__module.model.layers.16.self_attn/aten::slice/Reshape_5" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3908" name="__module.model.layers.16.self_attn/aten::slice/Reshape_1" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3909" name="__module.model.layers.16.self_attn/aten::slice/Reshape_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3910" name="__module.model.layers.16.self_attn/aten::slice/Reshape_3" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3911" name="__module.model.layers.16.self_attn/aten::slice/Slice" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="3092,x2.65"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3912" name="Constant_290212" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3913" name="__module.model.layers.16.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3093"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3914" name="__module.model.layers.16.self_attn/aten::slice/Reshape_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3915" name="__module.model.layers.16.self_attn/aten::slice/Reshape_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3916" name="__module.model.layers.16.self_attn/aten::slice/Reshape_7" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3917" name="__module.model.layers.16.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="3087"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3918" name="__module.model.layers.16.self_attn/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3095"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3919" name="__module.model.layers.16.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3096"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3920" name="__module.model.layers.16.self_attn/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3097"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3921" name="Constant_341191" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="3922" name="Constant_341184" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3923" name="Constant_341186" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3924" name="Constant_341188" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3925" name="Concat_341189" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3926" name="Broadcast_341192" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3927" name="ReadValue_333108" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.16.keypresent.16.key" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.16.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3928" name="Constant_325405" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3929" name="Gather_325406" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3930" name="self.model.layers.16.self_attn.k_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="3081605240" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3931" name="Convert_387307" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3932" name="self.model.layers.16.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="3084226680" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3933" name="Convert_387309" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3934" name="self.model.layers.16.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3935" name="self.model.layers.16.self_attn.k_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="3084247160" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3936" name="self.model.layers.16.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3937" name="Constant_387314" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3938" name="Reshape_387315" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3939" name="__module.model.layers.16.self_attn.k_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="3940" name="__module.model.layers.16.self_attn.k_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="3941" name="self.model.layers.16.self_attn.k_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="3084329080" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.16.self_attn.k_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="3942" name="__module.model.layers.16.self_attn.k_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="3943" name="__module.model.layers.16.self_attn.k_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3067,key_states.69"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="3944" name="Constant_301794" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3945" name="__module.model.layers.16.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3075"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3946" name="__module.model.layers.16.self_attn/aten::transpose/ScatterElementsUpdate_1" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3947" name="__module.model.layers.16.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3076,k.33"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3948" name="__module.model.layers.16.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3098"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3949" name="__module.model.layers.16.self_attn/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3950" name="__module.model.layers.16.self_attn/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="3951" name="__module.model.layers.16.self_attn/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="3099,3104" /> + </output> + </layer> + <layer id="3952" name="__module.model.layers.16.self_attn/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="3953" name="__module.model.layers.16.self_attn/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="3101,3102,3106,3107" /> + </output> + </layer> + <layer id="3954" name="Constant_220786" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3955" name="__module.model.layers.16.self_attn/aten::slice/Reshape_13" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3956" name="__module.model.layers.16.self_attn/aten::slice/Reshape_9" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3957" name="__module.model.layers.16.self_attn/aten::slice/Reshape_10" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3958" name="__module.model.layers.16.self_attn/aten::slice/Reshape_11" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3959" name="__module.model.layers.16.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="3108,x2.67"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3960" name="Constant_290213" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3961" name="__module.model.layers.16.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3109"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3962" name="__module.model.layers.16.self_attn/aten::slice/Reshape_12" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3963" name="__module.model.layers.16.self_attn/aten::slice/Reshape_14" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3964" name="__module.model.layers.16.self_attn/aten::slice/Reshape_15" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3965" name="__module.model.layers.16.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="3103"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="3966" name="__module.model.layers.16.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3111"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3967" name="__module.model.layers.16.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3112"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3968" name="__module.model.layers.16.self_attn/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3113"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3969" name="__module.model.layers.16.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.16.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3970" name="__module.model.layers.16.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="3125,3126,3127"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3971" name="__module.model.layers.16.self_attn/aten::size/ShapeOf_6" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3972" name="Constant_302444" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="938477672" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3973" name="Constant_302445" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3974" name="Gather_302446" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3975" name="Constant_268410" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3976" name="Constant_276751" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3977" name="Constant_276752" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3978" name="Gather_276753" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="3979" name="__module.model.layers.16.self_attn/prim::ListConstruct/Concat_2" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="3" precision="I64" names="3128"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="3980" name="__module.model.layers.16.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3129,hidden_states.491"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3981" name="Constant_301795" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3982" name="__module.model.layers.16.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3133,key_states.71"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3983" name="Constant_341204" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="3984" name="Constant_341197" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3985" name="Constant_341199" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3986" name="Constant_341201" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3987" name="Concat_341202" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="3988" name="Broadcast_341205" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3989" name="ReadValue_333110" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.16.valuepresent.16.value" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.16.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3990" name="Constant_325408" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="3991" name="Gather_325409" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3992" name="self.model.layers.16.self_attn.v_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="3084331128" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3993" name="Convert_387317" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3994" name="self.model.layers.16.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="3086952568" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3995" name="Convert_387319" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3996" name="self.model.layers.16.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3997" name="self.model.layers.16.self_attn.v_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="3086973048" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="3998" name="self.model.layers.16.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="3999" name="Constant_387324" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4000" name="Reshape_387325" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4001" name="__module.model.layers.16.self_attn.v_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4002" name="__module.model.layers.16.self_attn.v_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="4003" name="self.model.layers.16.self_attn.v_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="3087054968" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.16.self_attn.v_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="4004" name="__module.model.layers.16.self_attn.v_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="4005" name="__module.model.layers.16.self_attn.v_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3070,value_states.33"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="4006" name="Constant_301796" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4007" name="__module.model.layers.16.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3078"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4008" name="__module.model.layers.16.self_attn/aten::transpose/ScatterElementsUpdate_2" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4009" name="__module.model.layers.16.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3079"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4010" name="__module.model.layers.16.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.16.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4011" name="__module.model.layers.16.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="3141,3142,3143"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4012" name="__module.model.layers.16.self_attn/aten::size/ShapeOf_10" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4013" name="Constant_302181" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4014" name="__module.model.layers.16.self_attn/aten::size/Constant_11" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="4015" name="__module.model.layers.16.self_attn/aten::size/Gather_11" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="3135"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4016" name="Constant_268428" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4017" name="Constant_276761" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4018" name="Constant_276762" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4019" name="Gather_276763" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4020" name="__module.model.layers.16.self_attn/prim::ListConstruct/Concat_5" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="3144"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="4021" name="__module.model.layers.16.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3145,hidden_states.495"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4022" name="Constant_301797" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4023" name="__module.model.layers.16.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3149"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4024" name="__module.model.layers.16.self_attn/aten::slice/Reshape_60" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4025" name="ShapeOf_298956" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4026" name="Constant_298957" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4027" name="Constant_298958" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4028" name="Gather_298959" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4029" name="ShapeOf_298960" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4030" name="Constant_298961" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4031" name="Constant_298962" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4032" name="Gather_298963" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4033" name="Add_298964" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="3150"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4034" name="__module.model.layers.16.self_attn/aten::slice/Reshape_62" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4035" name="__module.model.layers.16.self_attn/aten::slice/Reshape_63" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4036" name="__module.model.layers.16.self_attn/aten::slice/Slice_15" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="3154"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="4037" name="__module.model.layers.16.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3155,attn_output.65"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4038" name="__module.model.layers.16.self_attn/aten::transpose/ScatterElementsUpdate_3" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4039" name="__module.model.layers.16.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3156"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4040" name="Constant_301798" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="798146608" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="4041" name="__module.model.layers.16.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3159"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4042" name="self.model.layers.16.self_attn.o_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="3087057016" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4043" name="Convert_386357" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4044" name="self.model.layers.16.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="3100164216" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4045" name="Convert_386359" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4046" name="self.model.layers.16.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4047" name="self.model.layers.16.self_attn.o_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="3100266616" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4048" name="self.model.layers.16.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4049" name="Constant_386364" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4050" name="Reshape_386365" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4051" name="__module.model.layers.16.self_attn.o_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4052" name="__module.model.layers.16.self_attn.o_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3161,3163,hidden_states.497"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4053" name="__module.model.layers.16/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3166,3168,3179,hidden_states.499,hidden_states.501"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4054" name="Constant_290217" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="3100676216" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4055" name="Constant_290216" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4056" name="Constant_290214" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4057" name="__module.model.layers.16.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3169"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4058" name="Constant_11876" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="3170"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4059" name="__module.model.layers.16.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3171,variance.67"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4060" name="Constant_290215" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4061" name="__module.model.layers.16.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3172"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4062" name="__module.model.layers.16.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4063" name="__module.model.layers.16.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3173"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4064" name="__module.model.layers.16.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3174,3175,hidden_states.503,hidden_states.505"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4065" name="__module.model.layers.16.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3176,3178"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4066" name="self.model.layers.16.mlp.gate_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="3100696696" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4067" name="Convert_385077" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4068" name="self.model.layers.16.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="3136086136" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4069" name="Convert_385079" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4070" name="self.model.layers.16.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4071" name="self.model.layers.16.mlp.gate_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="3136362616" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4072" name="self.model.layers.16.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4073" name="Constant_385084" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4074" name="Reshape_385085" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4075" name="__module.model.layers.16.mlp.gate_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4076" name="__module.model.layers.16.mlp.gate_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3184,input.33"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="4077" name="__module.model.layers.16.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="3185"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="4078" name="self.model.layers.16.mlp.up_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="3137468536" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4079" name="Convert_385067" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4080" name="self.model.layers.16.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="3172857976" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4081" name="Convert_385069" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4082" name="self.model.layers.16.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4083" name="self.model.layers.16.mlp.up_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="3173134456" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4084" name="self.model.layers.16.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4085" name="Constant_385074" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4086" name="Reshape_385075" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4087" name="__module.model.layers.16.mlp.up_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4088" name="__module.model.layers.16.mlp.up_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3187"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="4089" name="__module.model.layers.16.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3188"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="4090" name="self.model.layers.16.mlp.down_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 128" offset="3174240376" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4091" name="Convert_385087" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4092" name="self.model.layers.16.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 1" offset="3209629816" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4093" name="Convert_385089" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4094" name="self.model.layers.16.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4095" name="self.model.layers.16.mlp.down_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 108, 1" offset="3209906296" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4096" name="self.model.layers.16.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4097" name="Constant_385094" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="922101848" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4098" name="Reshape_385095" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="4099" name="__module.model.layers.16.mlp.down_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="4100" name="__module.model.layers.16.mlp.down_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3190,hidden_states.507"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4101" name="__module.model.layers.16/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3191,3193,3201,3212,hidden_states.509,hidden_states.511"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4102" name="Constant_290221" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="3211012216" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4103" name="Constant_290220" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4104" name="Constant_290218" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4105" name="__module.model.layers.17.input_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3202"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4106" name="Constant_11950" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="3203"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4107" name="__module.model.layers.17.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3204,variance.69"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4108" name="Constant_290219" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4109" name="__module.model.layers.17.input_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3205"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4110" name="__module.model.layers.17.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4111" name="__module.model.layers.17.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3206"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4112" name="__module.model.layers.17.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3207,3208,hidden_states.513,hidden_states.515"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4113" name="__module.model.layers.17.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3209,3211,hidden_states.517"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4114" name="self.model.layers.17.self_attn.q_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="3211032696" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4115" name="Convert_386367" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4116" name="self.model.layers.17.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="3224139896" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4117" name="Convert_386369" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4118" name="self.model.layers.17.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4119" name="self.model.layers.17.self_attn.q_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="3224242296" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4120" name="self.model.layers.17.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4121" name="Constant_386374" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4122" name="Reshape_386375" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4123" name="__module.model.layers.17.self_attn.q_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4124" name="__module.model.layers.17.self_attn.q_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4125" name="self.model.layers.17.self_attn.q_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="5120" offset="3224651896" size="10240" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.17.self_attn.q_proj.bias"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4126" name="__module.model.layers.17.self_attn.q_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4127" name="__module.model.layers.17.self_attn.q_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3221,query_states.35"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4128" name="Constant_301799" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="792694336" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4129" name="__module.model.layers.17.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3229"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4130" name="__module.model.layers.17.self_attn/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4131" name="__module.model.layers.17.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3230,q.35"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4132" name="__module.model.layers.17.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3239"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4133" name="__module.model.layers.17.self_attn/aten::size/ShapeOf_3" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4134" name="__module.model.layers.17.self_attn/aten::size/Constant_3" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="4135" name="__module.model.layers.17.self_attn/aten::size/Gather_3" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="3240,3245" /> + </output> + </layer> + <layer id="4136" name="__module.model.layers.17.self_attn/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="4137" name="__module.model.layers.17.self_attn/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="3242,3243,3247,3248" /> + </output> + </layer> + <layer id="4138" name="Constant_220800" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4139" name="__module.model.layers.17.self_attn/aten::slice/Reshape_5" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4140" name="__module.model.layers.17.self_attn/aten::slice/Reshape_1" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4141" name="__module.model.layers.17.self_attn/aten::slice/Reshape_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4142" name="__module.model.layers.17.self_attn/aten::slice/Reshape_3" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4143" name="__module.model.layers.17.self_attn/aten::slice/Slice" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="3249,x2.69"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4144" name="Constant_290222" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4145" name="__module.model.layers.17.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3250"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4146" name="__module.model.layers.17.self_attn/aten::slice/Reshape_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4147" name="__module.model.layers.17.self_attn/aten::slice/Reshape_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4148" name="__module.model.layers.17.self_attn/aten::slice/Reshape_7" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4149" name="__module.model.layers.17.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="3244"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4150" name="__module.model.layers.17.self_attn/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3252"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4151" name="__module.model.layers.17.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3253"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4152" name="__module.model.layers.17.self_attn/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3254"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4153" name="Constant_341217" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="4154" name="Constant_341210" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4155" name="Constant_341212" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4156" name="Constant_341214" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4157" name="Concat_341215" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4158" name="Broadcast_341218" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4159" name="ReadValue_333112" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.17.keypresent.17.key" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.17.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4160" name="Constant_325411" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4161" name="Gather_325412" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4162" name="self.model.layers.17.self_attn.k_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="3224662136" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4163" name="Convert_387327" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4164" name="self.model.layers.17.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="3227283576" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4165" name="Convert_387329" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4166" name="self.model.layers.17.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4167" name="self.model.layers.17.self_attn.k_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="3227304056" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4168" name="self.model.layers.17.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4169" name="Constant_387334" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4170" name="Reshape_387335" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4171" name="__module.model.layers.17.self_attn.k_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4172" name="__module.model.layers.17.self_attn.k_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="4173" name="self.model.layers.17.self_attn.k_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="3227385976" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.17.self_attn.k_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="4174" name="__module.model.layers.17.self_attn.k_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="4175" name="__module.model.layers.17.self_attn.k_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3224,key_states.73"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="4176" name="Constant_301800" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4177" name="__module.model.layers.17.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3232"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4178" name="__module.model.layers.17.self_attn/aten::transpose/ScatterElementsUpdate_1" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4179" name="__module.model.layers.17.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3233,k.35"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4180" name="__module.model.layers.17.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3255"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4181" name="__module.model.layers.17.self_attn/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4182" name="__module.model.layers.17.self_attn/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="4183" name="__module.model.layers.17.self_attn/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="3256,3261" /> + </output> + </layer> + <layer id="4184" name="__module.model.layers.17.self_attn/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="4185" name="__module.model.layers.17.self_attn/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="3258,3259,3263,3264" /> + </output> + </layer> + <layer id="4186" name="Constant_220801" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4187" name="__module.model.layers.17.self_attn/aten::slice/Reshape_13" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4188" name="__module.model.layers.17.self_attn/aten::slice/Reshape_9" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4189" name="__module.model.layers.17.self_attn/aten::slice/Reshape_10" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4190" name="__module.model.layers.17.self_attn/aten::slice/Reshape_11" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4191" name="__module.model.layers.17.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="3265,x2.71"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4192" name="Constant_290223" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4193" name="__module.model.layers.17.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3266"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4194" name="__module.model.layers.17.self_attn/aten::slice/Reshape_12" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4195" name="__module.model.layers.17.self_attn/aten::slice/Reshape_14" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4196" name="__module.model.layers.17.self_attn/aten::slice/Reshape_15" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4197" name="__module.model.layers.17.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="3260"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4198" name="__module.model.layers.17.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3268"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4199" name="__module.model.layers.17.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3269"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4200" name="__module.model.layers.17.self_attn/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3270"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4201" name="__module.model.layers.17.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.17.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4202" name="__module.model.layers.17.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="3282,3283,3284"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4203" name="__module.model.layers.17.self_attn/aten::size/ShapeOf_6" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4204" name="Constant_302449" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="938477672" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4205" name="Constant_302450" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4206" name="Gather_302451" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4207" name="Constant_268446" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4208" name="Constant_276786" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4209" name="Constant_276787" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4210" name="Gather_276788" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4211" name="__module.model.layers.17.self_attn/prim::ListConstruct/Concat_2" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="3" precision="I64" names="3285"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="4212" name="__module.model.layers.17.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3286,hidden_states.521"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4213" name="Constant_301801" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4214" name="__module.model.layers.17.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3290,key_states.75"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4215" name="Constant_341230" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="4216" name="Constant_341223" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4217" name="Constant_341225" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4218" name="Constant_341227" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4219" name="Concat_341228" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4220" name="Broadcast_341231" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4221" name="ReadValue_333114" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.17.valuepresent.17.value" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.17.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4222" name="Constant_325414" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4223" name="Gather_325415" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4224" name="self.model.layers.17.self_attn.v_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="3227388024" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4225" name="Convert_387337" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4226" name="self.model.layers.17.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="3230009464" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4227" name="Convert_387339" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4228" name="self.model.layers.17.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4229" name="self.model.layers.17.self_attn.v_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="3230029944" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4230" name="self.model.layers.17.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4231" name="Constant_387344" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4232" name="Reshape_387345" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4233" name="__module.model.layers.17.self_attn.v_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4234" name="__module.model.layers.17.self_attn.v_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="4235" name="self.model.layers.17.self_attn.v_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="3230111864" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.17.self_attn.v_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="4236" name="__module.model.layers.17.self_attn.v_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="4237" name="__module.model.layers.17.self_attn.v_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3227,value_states.35"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="4238" name="Constant_301802" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4239" name="__module.model.layers.17.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3235"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4240" name="__module.model.layers.17.self_attn/aten::transpose/ScatterElementsUpdate_2" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4241" name="__module.model.layers.17.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3236"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4242" name="__module.model.layers.17.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.17.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4243" name="__module.model.layers.17.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="3298,3299,3300"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4244" name="__module.model.layers.17.self_attn/aten::size/ShapeOf_10" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4245" name="Constant_302187" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4246" name="__module.model.layers.17.self_attn/aten::size/Constant_11" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="4247" name="__module.model.layers.17.self_attn/aten::size/Gather_11" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="3292"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4248" name="Constant_268464" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4249" name="Constant_276796" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4250" name="Constant_276797" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4251" name="Gather_276798" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4252" name="__module.model.layers.17.self_attn/prim::ListConstruct/Concat_5" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="3301"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="4253" name="__module.model.layers.17.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3302,hidden_states.525"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4254" name="Constant_301803" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4255" name="__module.model.layers.17.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3306"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4256" name="__module.model.layers.17.self_attn/aten::slice/Reshape_60" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4257" name="ShapeOf_299042" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4258" name="Constant_299043" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4259" name="Constant_299044" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4260" name="Gather_299045" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4261" name="ShapeOf_299046" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4262" name="Constant_299047" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4263" name="Constant_299048" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4264" name="Gather_299049" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4265" name="Add_299050" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="3307"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4266" name="__module.model.layers.17.self_attn/aten::slice/Reshape_62" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4267" name="__module.model.layers.17.self_attn/aten::slice/Reshape_63" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4268" name="__module.model.layers.17.self_attn/aten::slice/Slice_15" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="3311"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="4269" name="__module.model.layers.17.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3312,attn_output.69"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4270" name="__module.model.layers.17.self_attn/aten::transpose/ScatterElementsUpdate_3" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4271" name="__module.model.layers.17.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3313"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4272" name="Constant_301804" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="798146608" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="4273" name="__module.model.layers.17.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3316"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4274" name="self.model.layers.17.self_attn.o_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="3230113912" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4275" name="Convert_386377" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4276" name="self.model.layers.17.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="3243221112" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4277" name="Convert_386379" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4278" name="self.model.layers.17.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4279" name="self.model.layers.17.self_attn.o_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="3243323512" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4280" name="self.model.layers.17.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4281" name="Constant_386384" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4282" name="Reshape_386385" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4283" name="__module.model.layers.17.self_attn.o_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4284" name="__module.model.layers.17.self_attn.o_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3318,3320,hidden_states.527"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4285" name="__module.model.layers.17/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3323,3325,3336,hidden_states.529,hidden_states.531"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4286" name="Constant_290227" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="3243733112" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4287" name="Constant_290226" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4288" name="Constant_290224" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4289" name="__module.model.layers.17.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3326"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4290" name="Constant_12548" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="3327"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4291" name="__module.model.layers.17.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3328,variance.71"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4292" name="Constant_290225" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4293" name="__module.model.layers.17.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3329"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4294" name="__module.model.layers.17.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4295" name="__module.model.layers.17.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3330"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4296" name="__module.model.layers.17.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3331,3332,hidden_states.533,hidden_states.535"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4297" name="__module.model.layers.17.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3333,3335"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4298" name="self.model.layers.17.mlp.gate_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="3243753592" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4299" name="Convert_385107" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4300" name="self.model.layers.17.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="3279143032" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4301" name="Convert_385109" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4302" name="self.model.layers.17.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4303" name="self.model.layers.17.mlp.gate_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="3279419512" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4304" name="self.model.layers.17.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4305" name="Constant_385114" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4306" name="Reshape_385115" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4307" name="__module.model.layers.17.mlp.gate_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4308" name="__module.model.layers.17.mlp.gate_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3341,input.35"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="4309" name="__module.model.layers.17.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="3342"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="4310" name="self.model.layers.17.mlp.up_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="3280525432" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4311" name="Convert_385097" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4312" name="self.model.layers.17.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="3315914872" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4313" name="Convert_385099" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4314" name="self.model.layers.17.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4315" name="self.model.layers.17.mlp.up_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="3316191352" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4316" name="self.model.layers.17.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4317" name="Constant_385104" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4318" name="Reshape_385105" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4319" name="__module.model.layers.17.mlp.up_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4320" name="__module.model.layers.17.mlp.up_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3344"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="4321" name="__module.model.layers.17.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3345"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="4322" name="self.model.layers.17.mlp.down_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 128" offset="3317297272" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4323" name="Convert_385117" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4324" name="self.model.layers.17.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 1" offset="3352686712" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4325" name="Convert_385119" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4326" name="self.model.layers.17.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4327" name="self.model.layers.17.mlp.down_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 108, 1" offset="3352963192" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4328" name="self.model.layers.17.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4329" name="Constant_385124" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="922101848" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4330" name="Reshape_385125" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="4331" name="__module.model.layers.17.mlp.down_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="4332" name="__module.model.layers.17.mlp.down_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3347,hidden_states.537"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4333" name="__module.model.layers.17/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3348,3350,3358,3369,hidden_states.539,hidden_states.541"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4334" name="Constant_290231" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="3354069112" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4335" name="Constant_290230" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4336" name="Constant_290228" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4337" name="__module.model.layers.18.input_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3359"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4338" name="Constant_12622" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="3360"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4339" name="__module.model.layers.18.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3361,variance.73"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4340" name="Constant_290229" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4341" name="__module.model.layers.18.input_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3362"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4342" name="__module.model.layers.18.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4343" name="__module.model.layers.18.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3363"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4344" name="__module.model.layers.18.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3364,3365,hidden_states.543,hidden_states.545"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4345" name="__module.model.layers.18.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3366,3368,hidden_states.547"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4346" name="self.model.layers.18.self_attn.q_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="3354089592" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4347" name="Convert_386387" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4348" name="self.model.layers.18.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="3367196792" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4349" name="Convert_386389" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4350" name="self.model.layers.18.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4351" name="self.model.layers.18.self_attn.q_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="3367299192" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4352" name="self.model.layers.18.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4353" name="Constant_386394" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4354" name="Reshape_386395" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4355" name="__module.model.layers.18.self_attn.q_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4356" name="__module.model.layers.18.self_attn.q_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4357" name="self.model.layers.18.self_attn.q_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="5120" offset="3367708792" size="10240" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.18.self_attn.q_proj.bias"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4358" name="__module.model.layers.18.self_attn.q_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4359" name="__module.model.layers.18.self_attn.q_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3378,query_states.37"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4360" name="Constant_301805" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="792694336" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4361" name="__module.model.layers.18.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3386"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4362" name="__module.model.layers.18.self_attn/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4363" name="__module.model.layers.18.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3387,q.37"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4364" name="__module.model.layers.18.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3396"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4365" name="__module.model.layers.18.self_attn/aten::size/ShapeOf_3" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4366" name="__module.model.layers.18.self_attn/aten::size/Constant_3" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="4367" name="__module.model.layers.18.self_attn/aten::size/Gather_3" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="3397,3402" /> + </output> + </layer> + <layer id="4368" name="__module.model.layers.18.self_attn/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="4369" name="__module.model.layers.18.self_attn/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="3399,3400,3404,3405" /> + </output> + </layer> + <layer id="4370" name="Constant_220815" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4371" name="__module.model.layers.18.self_attn/aten::slice/Reshape_5" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4372" name="__module.model.layers.18.self_attn/aten::slice/Reshape_1" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4373" name="__module.model.layers.18.self_attn/aten::slice/Reshape_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4374" name="__module.model.layers.18.self_attn/aten::slice/Reshape_3" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4375" name="__module.model.layers.18.self_attn/aten::slice/Slice" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="3406,x2.73"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4376" name="Constant_290232" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4377" name="__module.model.layers.18.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3407"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4378" name="__module.model.layers.18.self_attn/aten::slice/Reshape_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4379" name="__module.model.layers.18.self_attn/aten::slice/Reshape_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4380" name="__module.model.layers.18.self_attn/aten::slice/Reshape_7" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4381" name="__module.model.layers.18.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="3401"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4382" name="__module.model.layers.18.self_attn/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3409"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4383" name="__module.model.layers.18.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3410"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4384" name="__module.model.layers.18.self_attn/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3411"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4385" name="Constant_341243" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="4386" name="Constant_341236" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4387" name="Constant_341238" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4388" name="Constant_341240" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4389" name="Concat_341241" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4390" name="Broadcast_341244" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4391" name="ReadValue_333116" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.18.keypresent.18.key" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.18.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4392" name="Constant_325417" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4393" name="Gather_325418" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4394" name="self.model.layers.18.self_attn.k_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="3367719032" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4395" name="Convert_387347" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4396" name="self.model.layers.18.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="3370340472" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4397" name="Convert_387349" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4398" name="self.model.layers.18.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4399" name="self.model.layers.18.self_attn.k_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="3370360952" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4400" name="self.model.layers.18.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4401" name="Constant_387354" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4402" name="Reshape_387355" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4403" name="__module.model.layers.18.self_attn.k_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4404" name="__module.model.layers.18.self_attn.k_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="4405" name="self.model.layers.18.self_attn.k_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="3370442872" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.18.self_attn.k_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="4406" name="__module.model.layers.18.self_attn.k_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="4407" name="__module.model.layers.18.self_attn.k_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3381,key_states.77"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="4408" name="Constant_301806" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4409" name="__module.model.layers.18.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3389"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4410" name="__module.model.layers.18.self_attn/aten::transpose/ScatterElementsUpdate_1" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4411" name="__module.model.layers.18.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3390,k.37"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4412" name="__module.model.layers.18.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3412"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4413" name="__module.model.layers.18.self_attn/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4414" name="__module.model.layers.18.self_attn/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="4415" name="__module.model.layers.18.self_attn/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="3413,3418" /> + </output> + </layer> + <layer id="4416" name="__module.model.layers.18.self_attn/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="4417" name="__module.model.layers.18.self_attn/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="3415,3416,3420,3421" /> + </output> + </layer> + <layer id="4418" name="Constant_220816" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4419" name="__module.model.layers.18.self_attn/aten::slice/Reshape_13" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4420" name="__module.model.layers.18.self_attn/aten::slice/Reshape_9" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4421" name="__module.model.layers.18.self_attn/aten::slice/Reshape_10" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4422" name="__module.model.layers.18.self_attn/aten::slice/Reshape_11" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4423" name="__module.model.layers.18.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="3422,x2.75"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4424" name="Constant_290233" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4425" name="__module.model.layers.18.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3423"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4426" name="__module.model.layers.18.self_attn/aten::slice/Reshape_12" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4427" name="__module.model.layers.18.self_attn/aten::slice/Reshape_14" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4428" name="__module.model.layers.18.self_attn/aten::slice/Reshape_15" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4429" name="__module.model.layers.18.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="3417"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4430" name="__module.model.layers.18.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3425"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4431" name="__module.model.layers.18.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3426"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4432" name="__module.model.layers.18.self_attn/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3427"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4433" name="__module.model.layers.18.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.18.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4434" name="__module.model.layers.18.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="3439,3440,3441"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4435" name="__module.model.layers.18.self_attn/aten::size/ShapeOf_6" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4436" name="Constant_302454" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="938477672" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4437" name="Constant_302455" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4438" name="Gather_302456" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4439" name="Constant_268482" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4440" name="Constant_276821" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4441" name="Constant_276822" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4442" name="Gather_276823" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4443" name="__module.model.layers.18.self_attn/prim::ListConstruct/Concat_2" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="3" precision="I64" names="3442"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="4444" name="__module.model.layers.18.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3443,hidden_states.551"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4445" name="Constant_301807" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4446" name="__module.model.layers.18.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3447,key_states.79"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4447" name="Constant_341256" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="4448" name="Constant_341249" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4449" name="Constant_341251" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4450" name="Constant_341253" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4451" name="Concat_341254" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4452" name="Broadcast_341257" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4453" name="ReadValue_333118" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.18.valuepresent.18.value" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.18.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4454" name="Constant_325420" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4455" name="Gather_325421" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4456" name="self.model.layers.18.self_attn.v_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="3370444920" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4457" name="Convert_387357" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4458" name="self.model.layers.18.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="3373066360" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4459" name="Convert_387359" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4460" name="self.model.layers.18.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4461" name="self.model.layers.18.self_attn.v_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="3373086840" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4462" name="self.model.layers.18.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4463" name="Constant_387364" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4464" name="Reshape_387365" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4465" name="__module.model.layers.18.self_attn.v_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4466" name="__module.model.layers.18.self_attn.v_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="4467" name="self.model.layers.18.self_attn.v_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="3373168760" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.18.self_attn.v_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="4468" name="__module.model.layers.18.self_attn.v_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="4469" name="__module.model.layers.18.self_attn.v_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3384,value_states.37"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="4470" name="Constant_301808" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4471" name="__module.model.layers.18.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3392"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4472" name="__module.model.layers.18.self_attn/aten::transpose/ScatterElementsUpdate_2" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4473" name="__module.model.layers.18.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3393"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4474" name="__module.model.layers.18.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.18.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4475" name="__module.model.layers.18.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="3455,3456,3457"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4476" name="__module.model.layers.18.self_attn/aten::size/ShapeOf_10" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4477" name="Constant_302193" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4478" name="__module.model.layers.18.self_attn/aten::size/Constant_11" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="4479" name="__module.model.layers.18.self_attn/aten::size/Gather_11" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="3449"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4480" name="Constant_268500" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4481" name="Constant_276831" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4482" name="Constant_276832" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4483" name="Gather_276833" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4484" name="__module.model.layers.18.self_attn/prim::ListConstruct/Concat_5" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="3458"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="4485" name="__module.model.layers.18.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3459,hidden_states.555"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4486" name="Constant_301809" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4487" name="__module.model.layers.18.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3463"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4488" name="__module.model.layers.18.self_attn/aten::slice/Reshape_60" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4489" name="ShapeOf_299128" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4490" name="Constant_299129" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4491" name="Constant_299130" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4492" name="Gather_299131" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4493" name="ShapeOf_299132" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4494" name="Constant_299133" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4495" name="Constant_299134" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4496" name="Gather_299135" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4497" name="Add_299136" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="3464"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4498" name="__module.model.layers.18.self_attn/aten::slice/Reshape_62" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4499" name="__module.model.layers.18.self_attn/aten::slice/Reshape_63" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4500" name="__module.model.layers.18.self_attn/aten::slice/Slice_15" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="3468"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="4501" name="__module.model.layers.18.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3469,attn_output.73"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4502" name="__module.model.layers.18.self_attn/aten::transpose/ScatterElementsUpdate_3" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4503" name="__module.model.layers.18.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3470"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4504" name="Constant_301810" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="798146608" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="4505" name="__module.model.layers.18.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3473"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4506" name="self.model.layers.18.self_attn.o_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="3373170808" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4507" name="Convert_386397" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4508" name="self.model.layers.18.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="3386278008" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4509" name="Convert_386399" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4510" name="self.model.layers.18.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4511" name="self.model.layers.18.self_attn.o_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="3386380408" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4512" name="self.model.layers.18.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4513" name="Constant_386404" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4514" name="Reshape_386405" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4515" name="__module.model.layers.18.self_attn.o_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4516" name="__module.model.layers.18.self_attn.o_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3475,3477,hidden_states.557"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4517" name="__module.model.layers.18/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3480,3482,3493,hidden_states.559,hidden_states.561"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4518" name="Constant_290237" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="3386790008" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4519" name="Constant_290236" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4520" name="Constant_290234" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4521" name="__module.model.layers.18.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3483"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4522" name="Constant_13220" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="3484"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4523" name="__module.model.layers.18.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3485,variance.75"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4524" name="Constant_290235" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4525" name="__module.model.layers.18.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3486"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4526" name="__module.model.layers.18.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4527" name="__module.model.layers.18.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3487"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4528" name="__module.model.layers.18.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3488,3489,hidden_states.563,hidden_states.565"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4529" name="__module.model.layers.18.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3490,3492"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4530" name="self.model.layers.18.mlp.gate_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="3386810488" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4531" name="Convert_385137" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4532" name="self.model.layers.18.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="3422199928" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4533" name="Convert_385139" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4534" name="self.model.layers.18.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4535" name="self.model.layers.18.mlp.gate_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="3422476408" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4536" name="self.model.layers.18.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4537" name="Constant_385144" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4538" name="Reshape_385145" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4539" name="__module.model.layers.18.mlp.gate_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4540" name="__module.model.layers.18.mlp.gate_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3498,input.37"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="4541" name="__module.model.layers.18.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="3499"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="4542" name="self.model.layers.18.mlp.up_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="3423582328" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4543" name="Convert_385127" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4544" name="self.model.layers.18.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="3458971768" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4545" name="Convert_385129" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4546" name="self.model.layers.18.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4547" name="self.model.layers.18.mlp.up_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="3459248248" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4548" name="self.model.layers.18.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4549" name="Constant_385134" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4550" name="Reshape_385135" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4551" name="__module.model.layers.18.mlp.up_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4552" name="__module.model.layers.18.mlp.up_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3501"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="4553" name="__module.model.layers.18.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3502"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="4554" name="self.model.layers.18.mlp.down_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 128" offset="3460354168" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4555" name="Convert_385147" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4556" name="self.model.layers.18.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 1" offset="3495743608" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4557" name="Convert_385149" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4558" name="self.model.layers.18.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4559" name="self.model.layers.18.mlp.down_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 108, 1" offset="3496020088" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4560" name="self.model.layers.18.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4561" name="Constant_385154" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="922101848" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4562" name="Reshape_385155" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="4563" name="__module.model.layers.18.mlp.down_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="4564" name="__module.model.layers.18.mlp.down_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3504,hidden_states.567"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4565" name="__module.model.layers.18/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3505,3507,3515,3526,hidden_states.569,hidden_states.571"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4566" name="Constant_290241" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="3497126008" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4567" name="Constant_290240" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4568" name="Constant_290238" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4569" name="__module.model.layers.19.input_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3516"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4570" name="Constant_13294" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="3517"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4571" name="__module.model.layers.19.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3518,variance.77"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4572" name="Constant_290239" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4573" name="__module.model.layers.19.input_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3519"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4574" name="__module.model.layers.19.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4575" name="__module.model.layers.19.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3520"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4576" name="__module.model.layers.19.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3521,3522,hidden_states.573,hidden_states.575"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4577" name="__module.model.layers.19.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3523,3525,hidden_states.577"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4578" name="self.model.layers.19.self_attn.q_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="3497146488" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4579" name="Convert_386407" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4580" name="self.model.layers.19.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="3510253688" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4581" name="Convert_386409" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4582" name="self.model.layers.19.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4583" name="self.model.layers.19.self_attn.q_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="3510356088" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4584" name="self.model.layers.19.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4585" name="Constant_386414" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4586" name="Reshape_386415" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4587" name="__module.model.layers.19.self_attn.q_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4588" name="__module.model.layers.19.self_attn.q_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4589" name="self.model.layers.19.self_attn.q_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="5120" offset="3510765688" size="10240" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.19.self_attn.q_proj.bias"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4590" name="__module.model.layers.19.self_attn.q_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4591" name="__module.model.layers.19.self_attn.q_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3535,query_states.39"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4592" name="Constant_301811" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="792694336" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4593" name="__module.model.layers.19.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3543"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4594" name="__module.model.layers.19.self_attn/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4595" name="__module.model.layers.19.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3544,q.39"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4596" name="__module.model.layers.19.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3553"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4597" name="__module.model.layers.19.self_attn/aten::size/ShapeOf_3" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4598" name="__module.model.layers.19.self_attn/aten::size/Constant_3" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="4599" name="__module.model.layers.19.self_attn/aten::size/Gather_3" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="3554,3559" /> + </output> + </layer> + <layer id="4600" name="__module.model.layers.19.self_attn/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="4601" name="__module.model.layers.19.self_attn/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="3556,3557,3561,3562" /> + </output> + </layer> + <layer id="4602" name="Constant_220830" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4603" name="__module.model.layers.19.self_attn/aten::slice/Reshape_5" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4604" name="__module.model.layers.19.self_attn/aten::slice/Reshape_1" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4605" name="__module.model.layers.19.self_attn/aten::slice/Reshape_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4606" name="__module.model.layers.19.self_attn/aten::slice/Reshape_3" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4607" name="__module.model.layers.19.self_attn/aten::slice/Slice" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="3563,x2.77"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4608" name="Constant_290242" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4609" name="__module.model.layers.19.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3564"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4610" name="__module.model.layers.19.self_attn/aten::slice/Reshape_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4611" name="__module.model.layers.19.self_attn/aten::slice/Reshape_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4612" name="__module.model.layers.19.self_attn/aten::slice/Reshape_7" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4613" name="__module.model.layers.19.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="3558"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4614" name="__module.model.layers.19.self_attn/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3566"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4615" name="__module.model.layers.19.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3567"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4616" name="__module.model.layers.19.self_attn/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3568"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4617" name="Constant_341269" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="4618" name="Constant_341262" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4619" name="Constant_341264" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4620" name="Constant_341266" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4621" name="Concat_341267" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4622" name="Broadcast_341270" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4623" name="ReadValue_333120" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.19.keypresent.19.key" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.19.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4624" name="Constant_325423" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4625" name="Gather_325424" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4626" name="self.model.layers.19.self_attn.k_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="3510775928" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4627" name="Convert_387367" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4628" name="self.model.layers.19.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="3513397368" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4629" name="Convert_387369" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4630" name="self.model.layers.19.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4631" name="self.model.layers.19.self_attn.k_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="3513417848" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4632" name="self.model.layers.19.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4633" name="Constant_387374" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4634" name="Reshape_387375" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4635" name="__module.model.layers.19.self_attn.k_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4636" name="__module.model.layers.19.self_attn.k_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="4637" name="self.model.layers.19.self_attn.k_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="3513499768" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.19.self_attn.k_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="4638" name="__module.model.layers.19.self_attn.k_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="4639" name="__module.model.layers.19.self_attn.k_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3538,key_states.81"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="4640" name="Constant_301812" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4641" name="__module.model.layers.19.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3546"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4642" name="__module.model.layers.19.self_attn/aten::transpose/ScatterElementsUpdate_1" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4643" name="__module.model.layers.19.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3547,k.39"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4644" name="__module.model.layers.19.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3569"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4645" name="__module.model.layers.19.self_attn/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4646" name="__module.model.layers.19.self_attn/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="4647" name="__module.model.layers.19.self_attn/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="3570,3575" /> + </output> + </layer> + <layer id="4648" name="__module.model.layers.19.self_attn/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="4649" name="__module.model.layers.19.self_attn/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="3572,3573,3577,3578" /> + </output> + </layer> + <layer id="4650" name="Constant_220831" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4651" name="__module.model.layers.19.self_attn/aten::slice/Reshape_13" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4652" name="__module.model.layers.19.self_attn/aten::slice/Reshape_9" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4653" name="__module.model.layers.19.self_attn/aten::slice/Reshape_10" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4654" name="__module.model.layers.19.self_attn/aten::slice/Reshape_11" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4655" name="__module.model.layers.19.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="3579,x2.79"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4656" name="Constant_290243" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4657" name="__module.model.layers.19.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3580"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4658" name="__module.model.layers.19.self_attn/aten::slice/Reshape_12" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4659" name="__module.model.layers.19.self_attn/aten::slice/Reshape_14" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4660" name="__module.model.layers.19.self_attn/aten::slice/Reshape_15" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4661" name="__module.model.layers.19.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="3574"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4662" name="__module.model.layers.19.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3582"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4663" name="__module.model.layers.19.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3583"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4664" name="__module.model.layers.19.self_attn/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3584"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4665" name="__module.model.layers.19.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.19.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4666" name="__module.model.layers.19.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="3596,3597,3598"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4667" name="__module.model.layers.19.self_attn/aten::size/ShapeOf_6" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4668" name="Constant_302459" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="938477672" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4669" name="Constant_302460" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4670" name="Gather_302461" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4671" name="Constant_268518" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4672" name="Constant_276856" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4673" name="Constant_276857" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4674" name="Gather_276858" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4675" name="__module.model.layers.19.self_attn/prim::ListConstruct/Concat_2" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="3" precision="I64" names="3599"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="4676" name="__module.model.layers.19.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3600,hidden_states.581"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4677" name="Constant_301813" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4678" name="__module.model.layers.19.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3604,key_states.83"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4679" name="Constant_341282" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="4680" name="Constant_341275" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4681" name="Constant_341277" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4682" name="Constant_341279" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4683" name="Concat_341280" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4684" name="Broadcast_341283" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4685" name="ReadValue_333122" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.19.valuepresent.19.value" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.19.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4686" name="Constant_325426" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4687" name="Gather_325427" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4688" name="self.model.layers.19.self_attn.v_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="3513501816" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4689" name="Convert_387377" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4690" name="self.model.layers.19.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="3516123256" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4691" name="Convert_387379" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4692" name="self.model.layers.19.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4693" name="self.model.layers.19.self_attn.v_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="3516143736" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4694" name="self.model.layers.19.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4695" name="Constant_387384" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4696" name="Reshape_387385" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4697" name="__module.model.layers.19.self_attn.v_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4698" name="__module.model.layers.19.self_attn.v_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="4699" name="self.model.layers.19.self_attn.v_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="3516225656" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.19.self_attn.v_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="4700" name="__module.model.layers.19.self_attn.v_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="4701" name="__module.model.layers.19.self_attn.v_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3541,value_states.39"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="4702" name="Constant_301814" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4703" name="__module.model.layers.19.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3549"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4704" name="__module.model.layers.19.self_attn/aten::transpose/ScatterElementsUpdate_2" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4705" name="__module.model.layers.19.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3550"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4706" name="__module.model.layers.19.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.19.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4707" name="__module.model.layers.19.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="3612,3613,3614"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4708" name="__module.model.layers.19.self_attn/aten::size/ShapeOf_10" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4709" name="Constant_302199" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4710" name="__module.model.layers.19.self_attn/aten::size/Constant_11" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="4711" name="__module.model.layers.19.self_attn/aten::size/Gather_11" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="3606"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4712" name="Constant_268536" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4713" name="Constant_276866" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4714" name="Constant_276867" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4715" name="Gather_276868" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4716" name="__module.model.layers.19.self_attn/prim::ListConstruct/Concat_5" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="3615"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="4717" name="__module.model.layers.19.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3616,hidden_states.585"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4718" name="Constant_301815" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4719" name="__module.model.layers.19.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3620"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4720" name="__module.model.layers.19.self_attn/aten::slice/Reshape_60" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4721" name="ShapeOf_299214" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4722" name="Constant_299215" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4723" name="Constant_299216" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4724" name="Gather_299217" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4725" name="ShapeOf_299218" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4726" name="Constant_299219" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4727" name="Constant_299220" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4728" name="Gather_299221" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4729" name="Add_299222" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="3621"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4730" name="__module.model.layers.19.self_attn/aten::slice/Reshape_62" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4731" name="__module.model.layers.19.self_attn/aten::slice/Reshape_63" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4732" name="__module.model.layers.19.self_attn/aten::slice/Slice_15" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="3625"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="4733" name="__module.model.layers.19.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3626,attn_output.77"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4734" name="__module.model.layers.19.self_attn/aten::transpose/ScatterElementsUpdate_3" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4735" name="__module.model.layers.19.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3627"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4736" name="Constant_301816" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="798146608" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="4737" name="__module.model.layers.19.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3630"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4738" name="self.model.layers.19.self_attn.o_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="3516227704" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4739" name="Convert_386417" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4740" name="self.model.layers.19.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="3529334904" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4741" name="Convert_386419" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4742" name="self.model.layers.19.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4743" name="self.model.layers.19.self_attn.o_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="3529437304" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4744" name="self.model.layers.19.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4745" name="Constant_386424" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4746" name="Reshape_386425" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4747" name="__module.model.layers.19.self_attn.o_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4748" name="__module.model.layers.19.self_attn.o_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3632,3634,hidden_states.587"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4749" name="__module.model.layers.19/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3637,3639,3650,hidden_states.589,hidden_states.591"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4750" name="Constant_290247" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="3529846904" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4751" name="Constant_290246" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4752" name="Constant_290244" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4753" name="__module.model.layers.19.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3640"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4754" name="Constant_13892" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="3641"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4755" name="__module.model.layers.19.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3642,variance.79"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4756" name="Constant_290245" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4757" name="__module.model.layers.19.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3643"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4758" name="__module.model.layers.19.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4759" name="__module.model.layers.19.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3644"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4760" name="__module.model.layers.19.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3645,3646,hidden_states.593,hidden_states.595"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4761" name="__module.model.layers.19.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3647,3649"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4762" name="self.model.layers.19.mlp.gate_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="3529867384" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4763" name="Convert_385167" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4764" name="self.model.layers.19.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="3565256824" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4765" name="Convert_385169" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4766" name="self.model.layers.19.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4767" name="self.model.layers.19.mlp.gate_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="3565533304" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4768" name="self.model.layers.19.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4769" name="Constant_385174" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4770" name="Reshape_385175" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4771" name="__module.model.layers.19.mlp.gate_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4772" name="__module.model.layers.19.mlp.gate_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3655,input.39"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="4773" name="__module.model.layers.19.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="3656"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="4774" name="self.model.layers.19.mlp.up_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="3566639224" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4775" name="Convert_385157" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4776" name="self.model.layers.19.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="3602028664" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4777" name="Convert_385159" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4778" name="self.model.layers.19.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4779" name="self.model.layers.19.mlp.up_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="3602305144" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4780" name="self.model.layers.19.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4781" name="Constant_385164" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4782" name="Reshape_385165" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4783" name="__module.model.layers.19.mlp.up_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4784" name="__module.model.layers.19.mlp.up_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3658"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="4785" name="__module.model.layers.19.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3659"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="4786" name="self.model.layers.19.mlp.down_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 128" offset="3603411064" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4787" name="Convert_385177" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4788" name="self.model.layers.19.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 1" offset="3638800504" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4789" name="Convert_385179" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4790" name="self.model.layers.19.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4791" name="self.model.layers.19.mlp.down_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 108, 1" offset="3639076984" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4792" name="self.model.layers.19.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4793" name="Constant_385184" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="922101848" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4794" name="Reshape_385185" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="4795" name="__module.model.layers.19.mlp.down_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="4796" name="__module.model.layers.19.mlp.down_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3661,hidden_states.597"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4797" name="__module.model.layers.19/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3662,3664,3672,3683,hidden_states.599,hidden_states.601"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4798" name="Constant_290251" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="3640182904" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4799" name="Constant_290250" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4800" name="Constant_290248" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4801" name="__module.model.layers.20.input_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3673"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4802" name="Constant_13966" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="3674"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4803" name="__module.model.layers.20.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3675,variance.81"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4804" name="Constant_290249" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4805" name="__module.model.layers.20.input_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3676"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4806" name="__module.model.layers.20.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4807" name="__module.model.layers.20.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3677"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4808" name="__module.model.layers.20.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3678,3679,hidden_states.603,hidden_states.605"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4809" name="__module.model.layers.20.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3680,3682,hidden_states.607"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4810" name="self.model.layers.20.self_attn.q_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="3640203384" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4811" name="Convert_386427" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4812" name="self.model.layers.20.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="3653310584" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4813" name="Convert_386429" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4814" name="self.model.layers.20.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4815" name="self.model.layers.20.self_attn.q_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="3653412984" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4816" name="self.model.layers.20.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4817" name="Constant_386434" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4818" name="Reshape_386435" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4819" name="__module.model.layers.20.self_attn.q_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4820" name="__module.model.layers.20.self_attn.q_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4821" name="self.model.layers.20.self_attn.q_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="5120" offset="3653822584" size="10240" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.20.self_attn.q_proj.bias"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4822" name="__module.model.layers.20.self_attn.q_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4823" name="__module.model.layers.20.self_attn.q_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3692,query_states.41"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4824" name="Constant_301817" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="792694336" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4825" name="__module.model.layers.20.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3700"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4826" name="__module.model.layers.20.self_attn/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4827" name="__module.model.layers.20.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3701,q.41"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4828" name="__module.model.layers.20.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3710"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4829" name="__module.model.layers.20.self_attn/aten::size/ShapeOf_3" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4830" name="__module.model.layers.20.self_attn/aten::size/Constant_3" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="4831" name="__module.model.layers.20.self_attn/aten::size/Gather_3" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="3711,3716" /> + </output> + </layer> + <layer id="4832" name="__module.model.layers.20.self_attn/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="4833" name="__module.model.layers.20.self_attn/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="3713,3714,3718,3719" /> + </output> + </layer> + <layer id="4834" name="Constant_220845" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4835" name="__module.model.layers.20.self_attn/aten::slice/Reshape_5" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4836" name="__module.model.layers.20.self_attn/aten::slice/Reshape_1" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4837" name="__module.model.layers.20.self_attn/aten::slice/Reshape_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4838" name="__module.model.layers.20.self_attn/aten::slice/Reshape_3" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4839" name="__module.model.layers.20.self_attn/aten::slice/Slice" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="3720,x2.81"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4840" name="Constant_290252" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4841" name="__module.model.layers.20.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3721"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4842" name="__module.model.layers.20.self_attn/aten::slice/Reshape_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4843" name="__module.model.layers.20.self_attn/aten::slice/Reshape_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4844" name="__module.model.layers.20.self_attn/aten::slice/Reshape_7" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4845" name="__module.model.layers.20.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="3715"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4846" name="__module.model.layers.20.self_attn/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3723"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4847" name="__module.model.layers.20.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3724"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4848" name="__module.model.layers.20.self_attn/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3725"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4849" name="Constant_341295" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="4850" name="Constant_341288" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4851" name="Constant_341290" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4852" name="Constant_341292" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4853" name="Concat_341293" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4854" name="Broadcast_341296" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4855" name="ReadValue_333128" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.20.keypresent.20.key" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.20.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4856" name="Constant_325429" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4857" name="Gather_325430" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4858" name="self.model.layers.20.self_attn.k_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="3653832824" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4859" name="Convert_387387" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4860" name="self.model.layers.20.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="3656454264" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4861" name="Convert_387389" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4862" name="self.model.layers.20.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4863" name="self.model.layers.20.self_attn.k_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="3656474744" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4864" name="self.model.layers.20.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4865" name="Constant_387394" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4866" name="Reshape_387395" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4867" name="__module.model.layers.20.self_attn.k_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4868" name="__module.model.layers.20.self_attn.k_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="4869" name="self.model.layers.20.self_attn.k_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="3656556664" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.20.self_attn.k_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="4870" name="__module.model.layers.20.self_attn.k_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="4871" name="__module.model.layers.20.self_attn.k_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3695,key_states.85"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="4872" name="Constant_301818" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4873" name="__module.model.layers.20.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3703"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4874" name="__module.model.layers.20.self_attn/aten::transpose/ScatterElementsUpdate_1" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4875" name="__module.model.layers.20.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3704,k.41"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4876" name="__module.model.layers.20.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3726"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4877" name="__module.model.layers.20.self_attn/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4878" name="__module.model.layers.20.self_attn/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="4879" name="__module.model.layers.20.self_attn/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="3727,3732" /> + </output> + </layer> + <layer id="4880" name="__module.model.layers.20.self_attn/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="4881" name="__module.model.layers.20.self_attn/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="3729,3730,3734,3735" /> + </output> + </layer> + <layer id="4882" name="Constant_220846" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4883" name="__module.model.layers.20.self_attn/aten::slice/Reshape_13" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4884" name="__module.model.layers.20.self_attn/aten::slice/Reshape_9" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4885" name="__module.model.layers.20.self_attn/aten::slice/Reshape_10" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4886" name="__module.model.layers.20.self_attn/aten::slice/Reshape_11" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4887" name="__module.model.layers.20.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="3736,x2.83"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4888" name="Constant_290253" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4889" name="__module.model.layers.20.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3737"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4890" name="__module.model.layers.20.self_attn/aten::slice/Reshape_12" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4891" name="__module.model.layers.20.self_attn/aten::slice/Reshape_14" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4892" name="__module.model.layers.20.self_attn/aten::slice/Reshape_15" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4893" name="__module.model.layers.20.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="3731"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="4894" name="__module.model.layers.20.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3739"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4895" name="__module.model.layers.20.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3740"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4896" name="__module.model.layers.20.self_attn/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3741"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4897" name="__module.model.layers.20.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.20.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4898" name="__module.model.layers.20.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="3753,3754,3755"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4899" name="__module.model.layers.20.self_attn/aten::size/ShapeOf_6" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4900" name="Constant_302464" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="938477672" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4901" name="Constant_302465" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4902" name="Gather_302466" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4903" name="Constant_268554" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4904" name="Constant_276891" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4905" name="Constant_276892" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4906" name="Gather_276893" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4907" name="__module.model.layers.20.self_attn/prim::ListConstruct/Concat_2" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="3" precision="I64" names="3756"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="4908" name="__module.model.layers.20.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3757,hidden_states.611"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4909" name="Constant_301819" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4910" name="__module.model.layers.20.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3761,key_states.87"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4911" name="Constant_341308" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="4912" name="Constant_341301" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4913" name="Constant_341303" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4914" name="Constant_341305" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4915" name="Concat_341306" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4916" name="Broadcast_341309" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4917" name="ReadValue_333130" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.20.valuepresent.20.value" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.20.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4918" name="Constant_325432" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4919" name="Gather_325433" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4920" name="self.model.layers.20.self_attn.v_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="3656558712" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4921" name="Convert_387397" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4922" name="self.model.layers.20.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="3659180152" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4923" name="Convert_387399" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4924" name="self.model.layers.20.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4925" name="self.model.layers.20.self_attn.v_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="3659200632" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4926" name="self.model.layers.20.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4927" name="Constant_387404" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4928" name="Reshape_387405" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4929" name="__module.model.layers.20.self_attn.v_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4930" name="__module.model.layers.20.self_attn.v_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="4931" name="self.model.layers.20.self_attn.v_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="3659282552" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.20.self_attn.v_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="4932" name="__module.model.layers.20.self_attn.v_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="4933" name="__module.model.layers.20.self_attn.v_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3698,value_states.41"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="4934" name="Constant_301820" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4935" name="__module.model.layers.20.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3706"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4936" name="__module.model.layers.20.self_attn/aten::transpose/ScatterElementsUpdate_2" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4937" name="__module.model.layers.20.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3707"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4938" name="__module.model.layers.20.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.20.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4939" name="__module.model.layers.20.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="3769,3770,3771"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4940" name="__module.model.layers.20.self_attn/aten::size/ShapeOf_10" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4941" name="Constant_302205" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4942" name="__module.model.layers.20.self_attn/aten::size/Constant_11" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="4943" name="__module.model.layers.20.self_attn/aten::size/Gather_11" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="3763"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4944" name="Constant_268572" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4945" name="Constant_276901" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4946" name="Constant_276902" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4947" name="Gather_276903" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4948" name="__module.model.layers.20.self_attn/prim::ListConstruct/Concat_5" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="3772"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="4949" name="__module.model.layers.20.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3773,hidden_states.615"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4950" name="Constant_301821" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4951" name="__module.model.layers.20.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3777"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4952" name="__module.model.layers.20.self_attn/aten::slice/Reshape_60" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4953" name="ShapeOf_299300" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4954" name="Constant_299301" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4955" name="Constant_299302" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4956" name="Gather_299303" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4957" name="ShapeOf_299304" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4958" name="Constant_299305" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4959" name="Constant_299306" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="4960" name="Gather_299307" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4961" name="Add_299308" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="3778"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4962" name="__module.model.layers.20.self_attn/aten::slice/Reshape_62" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4963" name="__module.model.layers.20.self_attn/aten::slice/Reshape_63" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4964" name="__module.model.layers.20.self_attn/aten::slice/Slice_15" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="3782"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="4965" name="__module.model.layers.20.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3783,attn_output.81"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4966" name="__module.model.layers.20.self_attn/aten::transpose/ScatterElementsUpdate_3" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="4967" name="__module.model.layers.20.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3784"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4968" name="Constant_301822" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="798146608" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="4969" name="__module.model.layers.20.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3787"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4970" name="self.model.layers.20.self_attn.o_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="3659284600" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4971" name="Convert_386437" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4972" name="self.model.layers.20.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="3672391800" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4973" name="Convert_386439" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4974" name="self.model.layers.20.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4975" name="self.model.layers.20.self_attn.o_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="3672494200" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4976" name="self.model.layers.20.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4977" name="Constant_386444" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="4978" name="Reshape_386445" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4979" name="__module.model.layers.20.self_attn.o_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4980" name="__module.model.layers.20.self_attn.o_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3789,3791,hidden_states.617"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4981" name="__module.model.layers.20/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3794,3796,3807,hidden_states.619,hidden_states.621"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4982" name="Constant_290257" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="3672903800" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4983" name="Constant_290256" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4984" name="Constant_290254" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4985" name="__module.model.layers.20.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3797"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4986" name="Constant_14564" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="3798"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4987" name="__module.model.layers.20.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3799,variance.83"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4988" name="Constant_290255" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4989" name="__module.model.layers.20.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3800"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4990" name="__module.model.layers.20.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4991" name="__module.model.layers.20.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3801"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4992" name="__module.model.layers.20.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3802,3803,hidden_states.623,hidden_states.625"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4993" name="__module.model.layers.20.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3804,3806"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="4994" name="self.model.layers.20.mlp.gate_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="3672924280" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4995" name="Convert_385197" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4996" name="self.model.layers.20.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="3708313720" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4997" name="Convert_385199" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="4998" name="self.model.layers.20.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="4999" name="self.model.layers.20.mlp.gate_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="3708590200" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5000" name="self.model.layers.20.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5001" name="Constant_385204" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5002" name="Reshape_385205" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5003" name="__module.model.layers.20.mlp.gate_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5004" name="__module.model.layers.20.mlp.gate_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3812,input.41"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="5005" name="__module.model.layers.20.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="3813"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="5006" name="self.model.layers.20.mlp.up_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="3709696120" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5007" name="Convert_385187" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5008" name="self.model.layers.20.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="3745085560" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5009" name="Convert_385189" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5010" name="self.model.layers.20.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5011" name="self.model.layers.20.mlp.up_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="3745362040" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5012" name="self.model.layers.20.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5013" name="Constant_385194" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5014" name="Reshape_385195" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5015" name="__module.model.layers.20.mlp.up_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5016" name="__module.model.layers.20.mlp.up_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3815"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="5017" name="__module.model.layers.20.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3816"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="5018" name="self.model.layers.20.mlp.down_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 128" offset="3746467960" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5019" name="Convert_385207" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5020" name="self.model.layers.20.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 1" offset="3781857400" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5021" name="Convert_385209" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5022" name="self.model.layers.20.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5023" name="self.model.layers.20.mlp.down_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 108, 1" offset="3782133880" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5024" name="self.model.layers.20.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5025" name="Constant_385214" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="922101848" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5026" name="Reshape_385215" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="5027" name="__module.model.layers.20.mlp.down_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="5028" name="__module.model.layers.20.mlp.down_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3818,hidden_states.627"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5029" name="__module.model.layers.20/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3819,3821,3829,3840,hidden_states.629,hidden_states.631"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5030" name="Constant_290261" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="3783239800" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5031" name="Constant_290260" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5032" name="Constant_290258" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5033" name="__module.model.layers.21.input_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3830"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5034" name="Constant_14638" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="3831"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5035" name="__module.model.layers.21.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3832,variance.85"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5036" name="Constant_290259" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5037" name="__module.model.layers.21.input_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3833"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5038" name="__module.model.layers.21.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5039" name="__module.model.layers.21.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3834"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5040" name="__module.model.layers.21.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3835,3836,hidden_states.633,hidden_states.635"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5041" name="__module.model.layers.21.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3837,3839,hidden_states.637"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5042" name="self.model.layers.21.self_attn.q_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="3783260280" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5043" name="Convert_386447" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5044" name="self.model.layers.21.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="3796367480" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5045" name="Convert_386449" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5046" name="self.model.layers.21.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5047" name="self.model.layers.21.self_attn.q_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="3796469880" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5048" name="self.model.layers.21.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5049" name="Constant_386454" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5050" name="Reshape_386455" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5051" name="__module.model.layers.21.self_attn.q_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5052" name="__module.model.layers.21.self_attn.q_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5053" name="self.model.layers.21.self_attn.q_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="5120" offset="3796879480" size="10240" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.21.self_attn.q_proj.bias"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5054" name="__module.model.layers.21.self_attn.q_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5055" name="__module.model.layers.21.self_attn.q_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3849,query_states.43"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5056" name="Constant_301823" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="792694336" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5057" name="__module.model.layers.21.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3857"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5058" name="__module.model.layers.21.self_attn/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5059" name="__module.model.layers.21.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3858,q.43"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5060" name="__module.model.layers.21.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3867"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5061" name="__module.model.layers.21.self_attn/aten::size/ShapeOf_3" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5062" name="__module.model.layers.21.self_attn/aten::size/Constant_3" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="5063" name="__module.model.layers.21.self_attn/aten::size/Gather_3" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="3868,3873" /> + </output> + </layer> + <layer id="5064" name="__module.model.layers.21.self_attn/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="5065" name="__module.model.layers.21.self_attn/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="3870,3871,3875,3876" /> + </output> + </layer> + <layer id="5066" name="Constant_220860" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5067" name="__module.model.layers.21.self_attn/aten::slice/Reshape_5" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5068" name="__module.model.layers.21.self_attn/aten::slice/Reshape_1" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5069" name="__module.model.layers.21.self_attn/aten::slice/Reshape_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5070" name="__module.model.layers.21.self_attn/aten::slice/Reshape_3" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5071" name="__module.model.layers.21.self_attn/aten::slice/Slice" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="3877,x2.85"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="5072" name="Constant_290262" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5073" name="__module.model.layers.21.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3878"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="5074" name="__module.model.layers.21.self_attn/aten::slice/Reshape_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5075" name="__module.model.layers.21.self_attn/aten::slice/Reshape_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5076" name="__module.model.layers.21.self_attn/aten::slice/Reshape_7" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5077" name="__module.model.layers.21.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="3872"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="5078" name="__module.model.layers.21.self_attn/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3880"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5079" name="__module.model.layers.21.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3881"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5080" name="__module.model.layers.21.self_attn/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3882"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5081" name="Constant_341321" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="5082" name="Constant_341314" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5083" name="Constant_341316" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5084" name="Constant_341318" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5085" name="Concat_341319" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5086" name="Broadcast_341322" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5087" name="ReadValue_333132" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.21.keypresent.21.key" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.21.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5088" name="Constant_325435" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5089" name="Gather_325436" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5090" name="self.model.layers.21.self_attn.k_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="3796889720" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5091" name="Convert_387407" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5092" name="self.model.layers.21.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="3799511160" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5093" name="Convert_387409" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5094" name="self.model.layers.21.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5095" name="self.model.layers.21.self_attn.k_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="3799531640" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5096" name="self.model.layers.21.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5097" name="Constant_387414" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5098" name="Reshape_387415" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5099" name="__module.model.layers.21.self_attn.k_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5100" name="__module.model.layers.21.self_attn.k_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="5101" name="self.model.layers.21.self_attn.k_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="3799613560" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.21.self_attn.k_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="5102" name="__module.model.layers.21.self_attn.k_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="5103" name="__module.model.layers.21.self_attn.k_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3852,key_states.89"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="5104" name="Constant_301824" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5105" name="__module.model.layers.21.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3860"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5106" name="__module.model.layers.21.self_attn/aten::transpose/ScatterElementsUpdate_1" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5107" name="__module.model.layers.21.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3861,k.43"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5108" name="__module.model.layers.21.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3883"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5109" name="__module.model.layers.21.self_attn/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5110" name="__module.model.layers.21.self_attn/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="5111" name="__module.model.layers.21.self_attn/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="3884,3889" /> + </output> + </layer> + <layer id="5112" name="__module.model.layers.21.self_attn/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="5113" name="__module.model.layers.21.self_attn/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="3886,3887,3891,3892" /> + </output> + </layer> + <layer id="5114" name="Constant_220861" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5115" name="__module.model.layers.21.self_attn/aten::slice/Reshape_13" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5116" name="__module.model.layers.21.self_attn/aten::slice/Reshape_9" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5117" name="__module.model.layers.21.self_attn/aten::slice/Reshape_10" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5118" name="__module.model.layers.21.self_attn/aten::slice/Reshape_11" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5119" name="__module.model.layers.21.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="3893,x2.87"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="5120" name="Constant_290263" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5121" name="__module.model.layers.21.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3894"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="5122" name="__module.model.layers.21.self_attn/aten::slice/Reshape_12" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5123" name="__module.model.layers.21.self_attn/aten::slice/Reshape_14" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5124" name="__module.model.layers.21.self_attn/aten::slice/Reshape_15" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5125" name="__module.model.layers.21.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="3888"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="5126" name="__module.model.layers.21.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3896"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5127" name="__module.model.layers.21.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3897"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5128" name="__module.model.layers.21.self_attn/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3898"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5129" name="__module.model.layers.21.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.21.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5130" name="__module.model.layers.21.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="3910,3911,3912"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5131" name="__module.model.layers.21.self_attn/aten::size/ShapeOf_6" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5132" name="Constant_302469" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="938477672" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5133" name="Constant_302470" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5134" name="Gather_302471" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5135" name="Constant_268590" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5136" name="Constant_276926" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5137" name="Constant_276927" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5138" name="Gather_276928" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5139" name="__module.model.layers.21.self_attn/prim::ListConstruct/Concat_2" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="3" precision="I64" names="3913"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="5140" name="__module.model.layers.21.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3914,hidden_states.641"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5141" name="Constant_301825" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5142" name="__module.model.layers.21.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3918,key_states.91"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5143" name="Constant_341334" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="5144" name="Constant_341327" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5145" name="Constant_341329" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5146" name="Constant_341331" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5147" name="Concat_341332" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5148" name="Broadcast_341335" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5149" name="ReadValue_333134" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.21.valuepresent.21.value" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.21.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5150" name="Constant_325438" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5151" name="Gather_325439" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5152" name="self.model.layers.21.self_attn.v_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="3799615608" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5153" name="Convert_387417" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5154" name="self.model.layers.21.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="3802237048" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5155" name="Convert_387419" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5156" name="self.model.layers.21.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5157" name="self.model.layers.21.self_attn.v_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="3802257528" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5158" name="self.model.layers.21.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5159" name="Constant_387424" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5160" name="Reshape_387425" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5161" name="__module.model.layers.21.self_attn.v_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5162" name="__module.model.layers.21.self_attn.v_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="5163" name="self.model.layers.21.self_attn.v_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="3802339448" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.21.self_attn.v_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="5164" name="__module.model.layers.21.self_attn.v_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="5165" name="__module.model.layers.21.self_attn.v_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3855,value_states.43"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="5166" name="Constant_301826" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5167" name="__module.model.layers.21.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3863"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5168" name="__module.model.layers.21.self_attn/aten::transpose/ScatterElementsUpdate_2" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5169" name="__module.model.layers.21.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3864"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5170" name="__module.model.layers.21.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.21.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5171" name="__module.model.layers.21.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="3926,3927,3928"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5172" name="__module.model.layers.21.self_attn/aten::size/ShapeOf_10" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5173" name="Constant_302211" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5174" name="__module.model.layers.21.self_attn/aten::size/Constant_11" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="5175" name="__module.model.layers.21.self_attn/aten::size/Gather_11" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="3920"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5176" name="Constant_268608" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5177" name="Constant_276936" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5178" name="Constant_276937" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5179" name="Gather_276938" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5180" name="__module.model.layers.21.self_attn/prim::ListConstruct/Concat_5" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="3929"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="5181" name="__module.model.layers.21.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3930,hidden_states.645"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5182" name="Constant_301827" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5183" name="__module.model.layers.21.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3934"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5184" name="__module.model.layers.21.self_attn/aten::slice/Reshape_60" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5185" name="ShapeOf_299386" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5186" name="Constant_299387" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5187" name="Constant_299388" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5188" name="Gather_299389" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5189" name="ShapeOf_299390" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5190" name="Constant_299391" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5191" name="Constant_299392" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5192" name="Gather_299393" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5193" name="Add_299394" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="3935"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5194" name="__module.model.layers.21.self_attn/aten::slice/Reshape_62" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5195" name="__module.model.layers.21.self_attn/aten::slice/Reshape_63" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5196" name="__module.model.layers.21.self_attn/aten::slice/Slice_15" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="3939"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="5197" name="__module.model.layers.21.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="3940,attn_output.85"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5198" name="__module.model.layers.21.self_attn/aten::transpose/ScatterElementsUpdate_3" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5199" name="__module.model.layers.21.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3941"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5200" name="Constant_301828" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="798146608" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="5201" name="__module.model.layers.21.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3944"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5202" name="self.model.layers.21.self_attn.o_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="3802341496" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5203" name="Convert_386457" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5204" name="self.model.layers.21.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="3815448696" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5205" name="Convert_386459" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5206" name="self.model.layers.21.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5207" name="self.model.layers.21.self_attn.o_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="3815551096" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5208" name="self.model.layers.21.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5209" name="Constant_386464" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5210" name="Reshape_386465" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5211" name="__module.model.layers.21.self_attn.o_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5212" name="__module.model.layers.21.self_attn.o_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3946,3948,hidden_states.647"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5213" name="__module.model.layers.21/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3951,3953,3964,hidden_states.649,hidden_states.651"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5214" name="Constant_290267" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="3815960696" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5215" name="Constant_290266" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5216" name="Constant_290264" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5217" name="__module.model.layers.21.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3954"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5218" name="Constant_15236" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="3955"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5219" name="__module.model.layers.21.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3956,variance.87"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5220" name="Constant_290265" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5221" name="__module.model.layers.21.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3957"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5222" name="__module.model.layers.21.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5223" name="__module.model.layers.21.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3958"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5224" name="__module.model.layers.21.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3959,3960,hidden_states.653,hidden_states.655"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5225" name="__module.model.layers.21.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3961,3963"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5226" name="self.model.layers.21.mlp.gate_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="3815981176" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5227" name="Convert_385227" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5228" name="self.model.layers.21.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="3851370616" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5229" name="Convert_385229" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5230" name="self.model.layers.21.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5231" name="self.model.layers.21.mlp.gate_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="3851647096" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5232" name="self.model.layers.21.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5233" name="Constant_385234" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5234" name="Reshape_385235" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5235" name="__module.model.layers.21.mlp.gate_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5236" name="__module.model.layers.21.mlp.gate_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3969,input.43"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="5237" name="__module.model.layers.21.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="3970"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="5238" name="self.model.layers.21.mlp.up_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="3852753016" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5239" name="Convert_385217" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5240" name="self.model.layers.21.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="3888142456" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5241" name="Convert_385219" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5242" name="self.model.layers.21.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5243" name="self.model.layers.21.mlp.up_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="3888418936" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5244" name="self.model.layers.21.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5245" name="Constant_385224" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5246" name="Reshape_385225" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5247" name="__module.model.layers.21.mlp.up_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5248" name="__module.model.layers.21.mlp.up_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3972"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="5249" name="__module.model.layers.21.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3973"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="5250" name="self.model.layers.21.mlp.down_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 128" offset="3889524856" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5251" name="Convert_385237" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5252" name="self.model.layers.21.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 1" offset="3924914296" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5253" name="Convert_385239" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5254" name="self.model.layers.21.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5255" name="self.model.layers.21.mlp.down_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 108, 1" offset="3925190776" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5256" name="self.model.layers.21.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5257" name="Constant_385244" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="922101848" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5258" name="Reshape_385245" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="5259" name="__module.model.layers.21.mlp.down_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="5260" name="__module.model.layers.21.mlp.down_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3975,hidden_states.657"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5261" name="__module.model.layers.21/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3976,3978,3986,3997,hidden_states.659,hidden_states.661"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5262" name="Constant_290271" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="3926296696" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5263" name="Constant_290270" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5264" name="Constant_290268" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5265" name="__module.model.layers.22.input_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3987"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5266" name="Constant_15310" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="3988"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5267" name="__module.model.layers.22.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3989,variance.89"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5268" name="Constant_290269" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5269" name="__module.model.layers.22.input_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3990"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5270" name="__module.model.layers.22.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5271" name="__module.model.layers.22.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3991"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5272" name="__module.model.layers.22.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3992,3993,hidden_states.663,hidden_states.665"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5273" name="__module.model.layers.22.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="3994,3996,hidden_states.667"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5274" name="self.model.layers.22.self_attn.q_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="3926317176" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5275" name="Convert_386467" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5276" name="self.model.layers.22.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="3939424376" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5277" name="Convert_386469" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5278" name="self.model.layers.22.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5279" name="self.model.layers.22.self_attn.q_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="3939526776" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5280" name="self.model.layers.22.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5281" name="Constant_386474" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5282" name="Reshape_386475" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5283" name="__module.model.layers.22.self_attn.q_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5284" name="__module.model.layers.22.self_attn.q_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5285" name="self.model.layers.22.self_attn.q_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="5120" offset="3939936376" size="10240" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.22.self_attn.q_proj.bias"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5286" name="__module.model.layers.22.self_attn.q_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5287" name="__module.model.layers.22.self_attn.q_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4006,query_states.45"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5288" name="Constant_301829" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="792694336" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5289" name="__module.model.layers.22.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4014"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5290" name="__module.model.layers.22.self_attn/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5291" name="__module.model.layers.22.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4015,q.45"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5292" name="__module.model.layers.22.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4024"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5293" name="__module.model.layers.22.self_attn/aten::size/ShapeOf_3" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5294" name="__module.model.layers.22.self_attn/aten::size/Constant_3" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="5295" name="__module.model.layers.22.self_attn/aten::size/Gather_3" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="4025,4030" /> + </output> + </layer> + <layer id="5296" name="__module.model.layers.22.self_attn/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="5297" name="__module.model.layers.22.self_attn/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="4027,4028,4032,4033" /> + </output> + </layer> + <layer id="5298" name="Constant_220875" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5299" name="__module.model.layers.22.self_attn/aten::slice/Reshape_5" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5300" name="__module.model.layers.22.self_attn/aten::slice/Reshape_1" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5301" name="__module.model.layers.22.self_attn/aten::slice/Reshape_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5302" name="__module.model.layers.22.self_attn/aten::slice/Reshape_3" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5303" name="__module.model.layers.22.self_attn/aten::slice/Slice" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="4034,x2.89"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="5304" name="Constant_290272" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5305" name="__module.model.layers.22.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4035"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="5306" name="__module.model.layers.22.self_attn/aten::slice/Reshape_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5307" name="__module.model.layers.22.self_attn/aten::slice/Reshape_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5308" name="__module.model.layers.22.self_attn/aten::slice/Reshape_7" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5309" name="__module.model.layers.22.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="4029"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="5310" name="__module.model.layers.22.self_attn/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4037"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5311" name="__module.model.layers.22.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4038"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5312" name="__module.model.layers.22.self_attn/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4039"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5313" name="Constant_341347" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="5314" name="Constant_341340" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5315" name="Constant_341342" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5316" name="Constant_341344" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5317" name="Concat_341345" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5318" name="Broadcast_341348" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5319" name="ReadValue_333136" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.22.keypresent.22.key" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.22.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5320" name="Constant_325441" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5321" name="Gather_325442" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5322" name="self.model.layers.22.self_attn.k_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="3939946616" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5323" name="Convert_387427" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5324" name="self.model.layers.22.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="3942568056" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5325" name="Convert_387429" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5326" name="self.model.layers.22.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5327" name="self.model.layers.22.self_attn.k_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="3942588536" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5328" name="self.model.layers.22.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5329" name="Constant_387434" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5330" name="Reshape_387435" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5331" name="__module.model.layers.22.self_attn.k_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5332" name="__module.model.layers.22.self_attn.k_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="5333" name="self.model.layers.22.self_attn.k_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="3942670456" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.22.self_attn.k_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="5334" name="__module.model.layers.22.self_attn.k_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="5335" name="__module.model.layers.22.self_attn.k_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4009,key_states.93"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="5336" name="Constant_301830" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5337" name="__module.model.layers.22.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4017"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5338" name="__module.model.layers.22.self_attn/aten::transpose/ScatterElementsUpdate_1" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5339" name="__module.model.layers.22.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4018,k.45"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5340" name="__module.model.layers.22.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4040"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5341" name="__module.model.layers.22.self_attn/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5342" name="__module.model.layers.22.self_attn/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="5343" name="__module.model.layers.22.self_attn/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="4041,4046" /> + </output> + </layer> + <layer id="5344" name="__module.model.layers.22.self_attn/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="5345" name="__module.model.layers.22.self_attn/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="4043,4044,4048,4049" /> + </output> + </layer> + <layer id="5346" name="Constant_220876" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5347" name="__module.model.layers.22.self_attn/aten::slice/Reshape_13" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5348" name="__module.model.layers.22.self_attn/aten::slice/Reshape_9" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5349" name="__module.model.layers.22.self_attn/aten::slice/Reshape_10" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5350" name="__module.model.layers.22.self_attn/aten::slice/Reshape_11" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5351" name="__module.model.layers.22.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="4050,x2.91"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="5352" name="Constant_290273" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5353" name="__module.model.layers.22.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4051"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="5354" name="__module.model.layers.22.self_attn/aten::slice/Reshape_12" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5355" name="__module.model.layers.22.self_attn/aten::slice/Reshape_14" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5356" name="__module.model.layers.22.self_attn/aten::slice/Reshape_15" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5357" name="__module.model.layers.22.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="4045"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="5358" name="__module.model.layers.22.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4053"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5359" name="__module.model.layers.22.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4054"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5360" name="__module.model.layers.22.self_attn/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4055"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5361" name="__module.model.layers.22.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.22.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5362" name="__module.model.layers.22.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="4067,4068,4069"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5363" name="__module.model.layers.22.self_attn/aten::size/ShapeOf_6" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5364" name="Constant_302474" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="938477672" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5365" name="Constant_302475" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5366" name="Gather_302476" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5367" name="Constant_268626" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5368" name="Constant_276961" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5369" name="Constant_276962" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5370" name="Gather_276963" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5371" name="__module.model.layers.22.self_attn/prim::ListConstruct/Concat_2" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="3" precision="I64" names="4070"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="5372" name="__module.model.layers.22.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4071,hidden_states.671"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5373" name="Constant_301831" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5374" name="__module.model.layers.22.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4075,key_states.95"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5375" name="Constant_341360" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="5376" name="Constant_341353" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5377" name="Constant_341355" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5378" name="Constant_341357" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5379" name="Concat_341358" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5380" name="Broadcast_341361" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5381" name="ReadValue_333138" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.22.valuepresent.22.value" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.22.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5382" name="Constant_325444" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5383" name="Gather_325445" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5384" name="self.model.layers.22.self_attn.v_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="3942672504" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5385" name="Convert_387437" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5386" name="self.model.layers.22.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="3945293944" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5387" name="Convert_387439" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5388" name="self.model.layers.22.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5389" name="self.model.layers.22.self_attn.v_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="3945314424" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5390" name="self.model.layers.22.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5391" name="Constant_387444" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5392" name="Reshape_387445" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5393" name="__module.model.layers.22.self_attn.v_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5394" name="__module.model.layers.22.self_attn.v_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="5395" name="self.model.layers.22.self_attn.v_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="3945396344" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.22.self_attn.v_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="5396" name="__module.model.layers.22.self_attn.v_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="5397" name="__module.model.layers.22.self_attn.v_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4012,value_states.45"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="5398" name="Constant_301832" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5399" name="__module.model.layers.22.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4020"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5400" name="__module.model.layers.22.self_attn/aten::transpose/ScatterElementsUpdate_2" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5401" name="__module.model.layers.22.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4021"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5402" name="__module.model.layers.22.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.22.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5403" name="__module.model.layers.22.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="4083,4084,4085"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5404" name="__module.model.layers.22.self_attn/aten::size/ShapeOf_10" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5405" name="Constant_302217" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5406" name="__module.model.layers.22.self_attn/aten::size/Constant_11" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="5407" name="__module.model.layers.22.self_attn/aten::size/Gather_11" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="4077"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5408" name="Constant_268644" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5409" name="Constant_276971" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5410" name="Constant_276972" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5411" name="Gather_276973" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5412" name="__module.model.layers.22.self_attn/prim::ListConstruct/Concat_5" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="4086"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="5413" name="__module.model.layers.22.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4087,hidden_states.675"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5414" name="Constant_301833" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5415" name="__module.model.layers.22.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4091"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5416" name="__module.model.layers.22.self_attn/aten::slice/Reshape_60" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5417" name="ShapeOf_299472" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5418" name="Constant_299473" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5419" name="Constant_299474" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5420" name="Gather_299475" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5421" name="ShapeOf_299476" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5422" name="Constant_299477" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5423" name="Constant_299478" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5424" name="Gather_299479" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5425" name="Add_299480" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="4092"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5426" name="__module.model.layers.22.self_attn/aten::slice/Reshape_62" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5427" name="__module.model.layers.22.self_attn/aten::slice/Reshape_63" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5428" name="__module.model.layers.22.self_attn/aten::slice/Slice_15" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="4096"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="5429" name="__module.model.layers.22.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4097,attn_output.89"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5430" name="__module.model.layers.22.self_attn/aten::transpose/ScatterElementsUpdate_3" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5431" name="__module.model.layers.22.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4098"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5432" name="Constant_301834" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="798146608" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="5433" name="__module.model.layers.22.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4101"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5434" name="self.model.layers.22.self_attn.o_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="3945398392" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5435" name="Convert_386477" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5436" name="self.model.layers.22.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="3958505592" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5437" name="Convert_386479" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5438" name="self.model.layers.22.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5439" name="self.model.layers.22.self_attn.o_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="3958607992" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5440" name="self.model.layers.22.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5441" name="Constant_386484" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5442" name="Reshape_386485" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5443" name="__module.model.layers.22.self_attn.o_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5444" name="__module.model.layers.22.self_attn.o_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4103,4105,hidden_states.677"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5445" name="__module.model.layers.22/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4108,4110,4121,hidden_states.679,hidden_states.681"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5446" name="Constant_290277" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="3959017592" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5447" name="Constant_290276" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5448" name="Constant_290274" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5449" name="__module.model.layers.22.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4111"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5450" name="Constant_15908" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="4112"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5451" name="__module.model.layers.22.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4113,variance.91"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5452" name="Constant_290275" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5453" name="__module.model.layers.22.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4114"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5454" name="__module.model.layers.22.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5455" name="__module.model.layers.22.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4115"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5456" name="__module.model.layers.22.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4116,4117,hidden_states.683,hidden_states.685"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5457" name="__module.model.layers.22.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4118,4120"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5458" name="self.model.layers.22.mlp.gate_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="3959038072" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5459" name="Convert_385257" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5460" name="self.model.layers.22.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="3994427512" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5461" name="Convert_385259" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5462" name="self.model.layers.22.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5463" name="self.model.layers.22.mlp.gate_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="3994703992" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5464" name="self.model.layers.22.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5465" name="Constant_385264" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5466" name="Reshape_385265" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5467" name="__module.model.layers.22.mlp.gate_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5468" name="__module.model.layers.22.mlp.gate_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4126,input.45"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="5469" name="__module.model.layers.22.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="4127"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="5470" name="self.model.layers.22.mlp.up_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="3995809912" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5471" name="Convert_385247" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5472" name="self.model.layers.22.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="4031199352" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5473" name="Convert_385249" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5474" name="self.model.layers.22.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5475" name="self.model.layers.22.mlp.up_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="4031475832" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5476" name="self.model.layers.22.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5477" name="Constant_385254" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5478" name="Reshape_385255" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5479" name="__module.model.layers.22.mlp.up_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5480" name="__module.model.layers.22.mlp.up_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4129"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="5481" name="__module.model.layers.22.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4130"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="5482" name="self.model.layers.22.mlp.down_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 128" offset="4032581752" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5483" name="Convert_385267" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5484" name="self.model.layers.22.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 1" offset="4067971192" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5485" name="Convert_385269" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5486" name="self.model.layers.22.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5487" name="self.model.layers.22.mlp.down_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 108, 1" offset="4068247672" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5488" name="self.model.layers.22.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5489" name="Constant_385274" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="922101848" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5490" name="Reshape_385275" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="5491" name="__module.model.layers.22.mlp.down_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="5492" name="__module.model.layers.22.mlp.down_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4132,hidden_states.687"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5493" name="__module.model.layers.22/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4133,4135,4143,4154,hidden_states.689,hidden_states.691"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5494" name="Constant_290281" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="4069353592" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5495" name="Constant_290280" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5496" name="Constant_290278" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5497" name="__module.model.layers.23.input_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4144"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5498" name="Constant_15982" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="4145"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5499" name="__module.model.layers.23.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4146,variance.93"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5500" name="Constant_290279" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5501" name="__module.model.layers.23.input_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4147"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5502" name="__module.model.layers.23.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5503" name="__module.model.layers.23.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4148"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5504" name="__module.model.layers.23.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4149,4150,hidden_states.693,hidden_states.695"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5505" name="__module.model.layers.23.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4151,4153,hidden_states.697"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5506" name="self.model.layers.23.self_attn.q_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="4069374072" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5507" name="Convert_386487" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5508" name="self.model.layers.23.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="4082481272" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5509" name="Convert_386489" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5510" name="self.model.layers.23.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5511" name="self.model.layers.23.self_attn.q_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="4082583672" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5512" name="self.model.layers.23.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5513" name="Constant_386494" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5514" name="Reshape_386495" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5515" name="__module.model.layers.23.self_attn.q_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5516" name="__module.model.layers.23.self_attn.q_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5517" name="self.model.layers.23.self_attn.q_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="5120" offset="4082993272" size="10240" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.23.self_attn.q_proj.bias"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5518" name="__module.model.layers.23.self_attn.q_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5519" name="__module.model.layers.23.self_attn.q_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4163,query_states.47"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5520" name="Constant_301835" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="792694336" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5521" name="__module.model.layers.23.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4171"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5522" name="__module.model.layers.23.self_attn/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5523" name="__module.model.layers.23.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4172,q.47"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5524" name="__module.model.layers.23.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4181"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5525" name="__module.model.layers.23.self_attn/aten::size/ShapeOf_3" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5526" name="__module.model.layers.23.self_attn/aten::size/Constant_3" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="5527" name="__module.model.layers.23.self_attn/aten::size/Gather_3" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="4182,4187" /> + </output> + </layer> + <layer id="5528" name="__module.model.layers.23.self_attn/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="5529" name="__module.model.layers.23.self_attn/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="4184,4185,4189,4190" /> + </output> + </layer> + <layer id="5530" name="Constant_220890" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5531" name="__module.model.layers.23.self_attn/aten::slice/Reshape_5" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5532" name="__module.model.layers.23.self_attn/aten::slice/Reshape_1" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5533" name="__module.model.layers.23.self_attn/aten::slice/Reshape_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5534" name="__module.model.layers.23.self_attn/aten::slice/Reshape_3" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5535" name="__module.model.layers.23.self_attn/aten::slice/Slice" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="4191,x2.93"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="5536" name="Constant_290282" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5537" name="__module.model.layers.23.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4192"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="5538" name="__module.model.layers.23.self_attn/aten::slice/Reshape_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5539" name="__module.model.layers.23.self_attn/aten::slice/Reshape_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5540" name="__module.model.layers.23.self_attn/aten::slice/Reshape_7" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5541" name="__module.model.layers.23.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="4186"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="5542" name="__module.model.layers.23.self_attn/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4194"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5543" name="__module.model.layers.23.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4195"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5544" name="__module.model.layers.23.self_attn/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4196"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5545" name="Constant_341373" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="5546" name="Constant_341366" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5547" name="Constant_341368" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5548" name="Constant_341370" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5549" name="Concat_341371" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5550" name="Broadcast_341374" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5551" name="ReadValue_333140" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.23.keypresent.23.key" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.23.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5552" name="Constant_325447" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5553" name="Gather_325448" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5554" name="self.model.layers.23.self_attn.k_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="4083003512" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5555" name="Convert_387447" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5556" name="self.model.layers.23.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="4085624952" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5557" name="Convert_387449" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5558" name="self.model.layers.23.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5559" name="self.model.layers.23.self_attn.k_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="4085645432" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5560" name="self.model.layers.23.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5561" name="Constant_387454" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5562" name="Reshape_387455" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5563" name="__module.model.layers.23.self_attn.k_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5564" name="__module.model.layers.23.self_attn.k_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="5565" name="self.model.layers.23.self_attn.k_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="4085727352" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.23.self_attn.k_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="5566" name="__module.model.layers.23.self_attn.k_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="5567" name="__module.model.layers.23.self_attn.k_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4166,key_states.97"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="5568" name="Constant_301836" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5569" name="__module.model.layers.23.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4174"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5570" name="__module.model.layers.23.self_attn/aten::transpose/ScatterElementsUpdate_1" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5571" name="__module.model.layers.23.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4175,k.47"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5572" name="__module.model.layers.23.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4197"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5573" name="__module.model.layers.23.self_attn/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5574" name="__module.model.layers.23.self_attn/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="5575" name="__module.model.layers.23.self_attn/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="4198,4203" /> + </output> + </layer> + <layer id="5576" name="__module.model.layers.23.self_attn/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="5577" name="__module.model.layers.23.self_attn/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="4200,4201,4205,4206" /> + </output> + </layer> + <layer id="5578" name="Constant_220891" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5579" name="__module.model.layers.23.self_attn/aten::slice/Reshape_13" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5580" name="__module.model.layers.23.self_attn/aten::slice/Reshape_9" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5581" name="__module.model.layers.23.self_attn/aten::slice/Reshape_10" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5582" name="__module.model.layers.23.self_attn/aten::slice/Reshape_11" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5583" name="__module.model.layers.23.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="4207,x2.95"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="5584" name="Constant_290283" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5585" name="__module.model.layers.23.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4208"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="5586" name="__module.model.layers.23.self_attn/aten::slice/Reshape_12" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5587" name="__module.model.layers.23.self_attn/aten::slice/Reshape_14" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5588" name="__module.model.layers.23.self_attn/aten::slice/Reshape_15" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5589" name="__module.model.layers.23.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="4202"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="5590" name="__module.model.layers.23.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4210"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5591" name="__module.model.layers.23.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4211"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5592" name="__module.model.layers.23.self_attn/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4212"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5593" name="__module.model.layers.23.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.23.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5594" name="__module.model.layers.23.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="4224,4225,4226"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5595" name="__module.model.layers.23.self_attn/aten::size/ShapeOf_6" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5596" name="Constant_302479" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="938477672" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5597" name="Constant_302480" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5598" name="Gather_302481" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5599" name="Constant_268662" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5600" name="Constant_276996" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5601" name="Constant_276997" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5602" name="Gather_276998" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5603" name="__module.model.layers.23.self_attn/prim::ListConstruct/Concat_2" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="3" precision="I64" names="4227"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="5604" name="__module.model.layers.23.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4228,hidden_states.701"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5605" name="Constant_301837" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5606" name="__module.model.layers.23.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4232,key_states.99"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5607" name="Constant_341386" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="5608" name="Constant_341379" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5609" name="Constant_341381" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5610" name="Constant_341383" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5611" name="Concat_341384" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5612" name="Broadcast_341387" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5613" name="ReadValue_333142" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.23.valuepresent.23.value" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.23.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5614" name="Constant_325450" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5615" name="Gather_325451" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5616" name="self.model.layers.23.self_attn.v_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="4085729400" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5617" name="Convert_387457" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5618" name="self.model.layers.23.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="4088350840" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5619" name="Convert_387459" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5620" name="self.model.layers.23.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5621" name="self.model.layers.23.self_attn.v_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="4088371320" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5622" name="self.model.layers.23.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5623" name="Constant_387464" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5624" name="Reshape_387465" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5625" name="__module.model.layers.23.self_attn.v_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5626" name="__module.model.layers.23.self_attn.v_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="5627" name="self.model.layers.23.self_attn.v_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="4088453240" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.23.self_attn.v_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="5628" name="__module.model.layers.23.self_attn.v_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="5629" name="__module.model.layers.23.self_attn.v_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4169,value_states.47"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="5630" name="Constant_301838" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5631" name="__module.model.layers.23.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4177"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5632" name="__module.model.layers.23.self_attn/aten::transpose/ScatterElementsUpdate_2" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5633" name="__module.model.layers.23.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4178"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5634" name="__module.model.layers.23.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.23.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5635" name="__module.model.layers.23.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="4240,4241,4242"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5636" name="__module.model.layers.23.self_attn/aten::size/ShapeOf_10" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5637" name="Constant_302223" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5638" name="__module.model.layers.23.self_attn/aten::size/Constant_11" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="5639" name="__module.model.layers.23.self_attn/aten::size/Gather_11" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="4234"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5640" name="Constant_268680" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5641" name="Constant_277006" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5642" name="Constant_277007" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5643" name="Gather_277008" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5644" name="__module.model.layers.23.self_attn/prim::ListConstruct/Concat_5" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="4243"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="5645" name="__module.model.layers.23.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4244,hidden_states.705"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5646" name="Constant_301839" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5647" name="__module.model.layers.23.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4248"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5648" name="__module.model.layers.23.self_attn/aten::slice/Reshape_60" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5649" name="ShapeOf_299558" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5650" name="Constant_299559" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5651" name="Constant_299560" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5652" name="Gather_299561" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5653" name="ShapeOf_299562" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5654" name="Constant_299563" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5655" name="Constant_299564" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5656" name="Gather_299565" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5657" name="Add_299566" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="4249"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5658" name="__module.model.layers.23.self_attn/aten::slice/Reshape_62" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5659" name="__module.model.layers.23.self_attn/aten::slice/Reshape_63" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5660" name="__module.model.layers.23.self_attn/aten::slice/Slice_15" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="4253"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="5661" name="__module.model.layers.23.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4254,attn_output.93"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5662" name="__module.model.layers.23.self_attn/aten::transpose/ScatterElementsUpdate_3" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5663" name="__module.model.layers.23.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4255"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5664" name="Constant_301840" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="798146608" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="5665" name="__module.model.layers.23.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4258"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5666" name="self.model.layers.23.self_attn.o_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="4088455288" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5667" name="Convert_386497" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5668" name="self.model.layers.23.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="4101562488" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5669" name="Convert_386499" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5670" name="self.model.layers.23.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5671" name="self.model.layers.23.self_attn.o_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="4101664888" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5672" name="self.model.layers.23.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5673" name="Constant_386504" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5674" name="Reshape_386505" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5675" name="__module.model.layers.23.self_attn.o_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5676" name="__module.model.layers.23.self_attn.o_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4260,4262,hidden_states.707"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5677" name="__module.model.layers.23/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4265,4267,4278,hidden_states.709,hidden_states.711"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5678" name="Constant_290287" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="4102074488" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5679" name="Constant_290286" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5680" name="Constant_290284" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5681" name="__module.model.layers.23.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4268"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5682" name="Constant_16580" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="4269"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5683" name="__module.model.layers.23.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4270,variance.95"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5684" name="Constant_290285" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5685" name="__module.model.layers.23.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4271"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5686" name="__module.model.layers.23.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5687" name="__module.model.layers.23.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4272"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5688" name="__module.model.layers.23.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4273,4274,hidden_states.713,hidden_states.715"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5689" name="__module.model.layers.23.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4275,4277"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5690" name="self.model.layers.23.mlp.gate_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="4102094968" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5691" name="Convert_385287" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5692" name="self.model.layers.23.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="4137484408" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5693" name="Convert_385289" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5694" name="self.model.layers.23.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5695" name="self.model.layers.23.mlp.gate_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="4137760888" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5696" name="self.model.layers.23.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5697" name="Constant_385294" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5698" name="Reshape_385295" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5699" name="__module.model.layers.23.mlp.gate_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5700" name="__module.model.layers.23.mlp.gate_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4283,input.47"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="5701" name="__module.model.layers.23.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="4284"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="5702" name="self.model.layers.23.mlp.up_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="4138866808" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5703" name="Convert_385277" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5704" name="self.model.layers.23.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="4174256248" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5705" name="Convert_385279" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5706" name="self.model.layers.23.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5707" name="self.model.layers.23.mlp.up_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="4174532728" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5708" name="self.model.layers.23.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5709" name="Constant_385284" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5710" name="Reshape_385285" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5711" name="__module.model.layers.23.mlp.up_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5712" name="__module.model.layers.23.mlp.up_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4286"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="5713" name="__module.model.layers.23.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4287"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="5714" name="self.model.layers.23.mlp.down_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 128" offset="4175638648" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5715" name="Convert_385297" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5716" name="self.model.layers.23.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 1" offset="4211028088" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5717" name="Convert_385299" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5718" name="self.model.layers.23.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5719" name="self.model.layers.23.mlp.down_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 108, 1" offset="4211304568" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5720" name="self.model.layers.23.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5721" name="Constant_385304" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="922101848" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5722" name="Reshape_385305" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="5723" name="__module.model.layers.23.mlp.down_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="5724" name="__module.model.layers.23.mlp.down_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4289,hidden_states.717"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5725" name="__module.model.layers.23/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4290,4292,4300,4311,hidden_states.719,hidden_states.721"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5726" name="Constant_290291" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="4212410488" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5727" name="Constant_290290" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5728" name="Constant_290288" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5729" name="__module.model.layers.24.input_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4301"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5730" name="Constant_16654" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="4302"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5731" name="__module.model.layers.24.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4303,variance.97"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5732" name="Constant_290289" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5733" name="__module.model.layers.24.input_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4304"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5734" name="__module.model.layers.24.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5735" name="__module.model.layers.24.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4305"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5736" name="__module.model.layers.24.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4306,4307,hidden_states.723,hidden_states.725"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5737" name="__module.model.layers.24.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4308,4310,hidden_states.727"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5738" name="self.model.layers.24.self_attn.q_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="4212430968" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5739" name="Convert_386507" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5740" name="self.model.layers.24.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="4225538168" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5741" name="Convert_386509" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5742" name="self.model.layers.24.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5743" name="self.model.layers.24.self_attn.q_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="4225640568" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5744" name="self.model.layers.24.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5745" name="Constant_386514" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5746" name="Reshape_386515" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5747" name="__module.model.layers.24.self_attn.q_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5748" name="__module.model.layers.24.self_attn.q_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5749" name="self.model.layers.24.self_attn.q_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="5120" offset="4226050168" size="10240" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.24.self_attn.q_proj.bias"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5750" name="__module.model.layers.24.self_attn.q_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5751" name="__module.model.layers.24.self_attn.q_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4320,query_states.49"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5752" name="Constant_301841" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="792694336" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5753" name="__module.model.layers.24.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4328"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5754" name="__module.model.layers.24.self_attn/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5755" name="__module.model.layers.24.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4329,q.49"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5756" name="__module.model.layers.24.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4338"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5757" name="__module.model.layers.24.self_attn/aten::size/ShapeOf_3" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5758" name="__module.model.layers.24.self_attn/aten::size/Constant_3" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="5759" name="__module.model.layers.24.self_attn/aten::size/Gather_3" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="4339,4344" /> + </output> + </layer> + <layer id="5760" name="__module.model.layers.24.self_attn/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="5761" name="__module.model.layers.24.self_attn/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="4341,4342,4346,4347" /> + </output> + </layer> + <layer id="5762" name="Constant_220905" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5763" name="__module.model.layers.24.self_attn/aten::slice/Reshape_5" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5764" name="__module.model.layers.24.self_attn/aten::slice/Reshape_1" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5765" name="__module.model.layers.24.self_attn/aten::slice/Reshape_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5766" name="__module.model.layers.24.self_attn/aten::slice/Reshape_3" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5767" name="__module.model.layers.24.self_attn/aten::slice/Slice" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="4348,x2.97"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="5768" name="Constant_290292" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5769" name="__module.model.layers.24.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4349"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="5770" name="__module.model.layers.24.self_attn/aten::slice/Reshape_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5771" name="__module.model.layers.24.self_attn/aten::slice/Reshape_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5772" name="__module.model.layers.24.self_attn/aten::slice/Reshape_7" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5773" name="__module.model.layers.24.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="4343"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="5774" name="__module.model.layers.24.self_attn/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4351"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5775" name="__module.model.layers.24.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4352"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5776" name="__module.model.layers.24.self_attn/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4353"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5777" name="Constant_341399" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="5778" name="Constant_341392" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5779" name="Constant_341394" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5780" name="Constant_341396" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5781" name="Concat_341397" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5782" name="Broadcast_341400" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5783" name="ReadValue_333144" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.24.keypresent.24.key" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.24.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5784" name="Constant_325453" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5785" name="Gather_325454" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5786" name="self.model.layers.24.self_attn.k_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="4226060408" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5787" name="Convert_387467" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5788" name="self.model.layers.24.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="4228681848" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5789" name="Convert_387469" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5790" name="self.model.layers.24.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5791" name="self.model.layers.24.self_attn.k_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="4228702328" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5792" name="self.model.layers.24.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5793" name="Constant_387474" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5794" name="Reshape_387475" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5795" name="__module.model.layers.24.self_attn.k_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5796" name="__module.model.layers.24.self_attn.k_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="5797" name="self.model.layers.24.self_attn.k_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="4228784248" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.24.self_attn.k_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="5798" name="__module.model.layers.24.self_attn.k_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="5799" name="__module.model.layers.24.self_attn.k_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4323,key_states.101"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="5800" name="Constant_301842" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5801" name="__module.model.layers.24.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4331"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5802" name="__module.model.layers.24.self_attn/aten::transpose/ScatterElementsUpdate_1" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5803" name="__module.model.layers.24.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4332,k.49"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5804" name="__module.model.layers.24.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4354"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5805" name="__module.model.layers.24.self_attn/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5806" name="__module.model.layers.24.self_attn/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="5807" name="__module.model.layers.24.self_attn/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="4355,4360" /> + </output> + </layer> + <layer id="5808" name="__module.model.layers.24.self_attn/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="5809" name="__module.model.layers.24.self_attn/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="4357,4358,4362,4363" /> + </output> + </layer> + <layer id="5810" name="Constant_220906" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5811" name="__module.model.layers.24.self_attn/aten::slice/Reshape_13" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5812" name="__module.model.layers.24.self_attn/aten::slice/Reshape_9" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5813" name="__module.model.layers.24.self_attn/aten::slice/Reshape_10" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5814" name="__module.model.layers.24.self_attn/aten::slice/Reshape_11" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5815" name="__module.model.layers.24.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="4364,x2.99"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="5816" name="Constant_290293" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5817" name="__module.model.layers.24.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4365"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="5818" name="__module.model.layers.24.self_attn/aten::slice/Reshape_12" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5819" name="__module.model.layers.24.self_attn/aten::slice/Reshape_14" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5820" name="__module.model.layers.24.self_attn/aten::slice/Reshape_15" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5821" name="__module.model.layers.24.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="4359"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="5822" name="__module.model.layers.24.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4367"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5823" name="__module.model.layers.24.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4368"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5824" name="__module.model.layers.24.self_attn/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4369"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5825" name="__module.model.layers.24.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.24.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5826" name="__module.model.layers.24.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="4381,4382,4383"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5827" name="__module.model.layers.24.self_attn/aten::size/ShapeOf_6" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5828" name="Constant_302484" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="938477672" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5829" name="Constant_302485" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5830" name="Gather_302486" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5831" name="Constant_268698" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5832" name="Constant_277031" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5833" name="Constant_277032" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5834" name="Gather_277033" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5835" name="__module.model.layers.24.self_attn/prim::ListConstruct/Concat_2" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="3" precision="I64" names="4384"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="5836" name="__module.model.layers.24.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4385,hidden_states.731"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5837" name="Constant_301843" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5838" name="__module.model.layers.24.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4389,key_states.103"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5839" name="Constant_341412" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="5840" name="Constant_341405" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5841" name="Constant_341407" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5842" name="Constant_341409" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5843" name="Concat_341410" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5844" name="Broadcast_341413" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5845" name="ReadValue_333146" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.24.valuepresent.24.value" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.24.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5846" name="Constant_325456" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5847" name="Gather_325457" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5848" name="self.model.layers.24.self_attn.v_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="4228786296" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5849" name="Convert_387477" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5850" name="self.model.layers.24.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="4231407736" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5851" name="Convert_387479" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5852" name="self.model.layers.24.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5853" name="self.model.layers.24.self_attn.v_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="4231428216" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5854" name="self.model.layers.24.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5855" name="Constant_387484" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5856" name="Reshape_387485" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5857" name="__module.model.layers.24.self_attn.v_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5858" name="__module.model.layers.24.self_attn.v_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="5859" name="self.model.layers.24.self_attn.v_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="4231510136" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.24.self_attn.v_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="5860" name="__module.model.layers.24.self_attn.v_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="5861" name="__module.model.layers.24.self_attn.v_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4326,value_states.49"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="5862" name="Constant_301844" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5863" name="__module.model.layers.24.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4334"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5864" name="__module.model.layers.24.self_attn/aten::transpose/ScatterElementsUpdate_2" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5865" name="__module.model.layers.24.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4335"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5866" name="__module.model.layers.24.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.24.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5867" name="__module.model.layers.24.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="4397,4398,4399"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5868" name="__module.model.layers.24.self_attn/aten::size/ShapeOf_10" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5869" name="Constant_302229" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5870" name="__module.model.layers.24.self_attn/aten::size/Constant_11" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="5871" name="__module.model.layers.24.self_attn/aten::size/Gather_11" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="4391"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5872" name="Constant_268716" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5873" name="Constant_277041" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5874" name="Constant_277042" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5875" name="Gather_277043" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5876" name="__module.model.layers.24.self_attn/prim::ListConstruct/Concat_5" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="4400"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="5877" name="__module.model.layers.24.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4401,hidden_states.735"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5878" name="Constant_301845" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5879" name="__module.model.layers.24.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4405"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5880" name="__module.model.layers.24.self_attn/aten::slice/Reshape_60" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5881" name="ShapeOf_299644" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5882" name="Constant_299645" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5883" name="Constant_299646" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5884" name="Gather_299647" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5885" name="ShapeOf_299648" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5886" name="Constant_299649" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5887" name="Constant_299650" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="5888" name="Gather_299651" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5889" name="Add_299652" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="4406"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5890" name="__module.model.layers.24.self_attn/aten::slice/Reshape_62" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5891" name="__module.model.layers.24.self_attn/aten::slice/Reshape_63" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5892" name="__module.model.layers.24.self_attn/aten::slice/Slice_15" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="4410"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="5893" name="__module.model.layers.24.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4411,attn_output.97"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5894" name="__module.model.layers.24.self_attn/aten::transpose/ScatterElementsUpdate_3" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5895" name="__module.model.layers.24.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4412"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5896" name="Constant_301846" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="798146608" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="5897" name="__module.model.layers.24.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4415"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5898" name="self.model.layers.24.self_attn.o_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="4231512184" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5899" name="Convert_386517" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5900" name="self.model.layers.24.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="4244619384" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5901" name="Convert_386519" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5902" name="self.model.layers.24.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5903" name="self.model.layers.24.self_attn.o_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="4244721784" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5904" name="self.model.layers.24.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5905" name="Constant_386524" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5906" name="Reshape_386525" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5907" name="__module.model.layers.24.self_attn.o_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5908" name="__module.model.layers.24.self_attn.o_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4417,4419,hidden_states.737"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5909" name="__module.model.layers.24/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4422,4424,4435,hidden_states.739,hidden_states.741"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5910" name="Constant_290297" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="4245131384" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5911" name="Constant_290296" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5912" name="Constant_290294" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5913" name="__module.model.layers.24.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4425"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5914" name="Constant_17252" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="4426"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5915" name="__module.model.layers.24.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4427,variance.99"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5916" name="Constant_290295" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5917" name="__module.model.layers.24.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4428"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5918" name="__module.model.layers.24.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5919" name="__module.model.layers.24.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4429"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5920" name="__module.model.layers.24.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4430,4431,hidden_states.743,hidden_states.745"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5921" name="__module.model.layers.24.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4432,4434"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5922" name="self.model.layers.24.mlp.gate_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="4245151864" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5923" name="Convert_385317" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5924" name="self.model.layers.24.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="4280541304" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5925" name="Convert_385319" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5926" name="self.model.layers.24.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5927" name="self.model.layers.24.mlp.gate_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="4280817784" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5928" name="self.model.layers.24.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5929" name="Constant_385324" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5930" name="Reshape_385325" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5931" name="__module.model.layers.24.mlp.gate_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5932" name="__module.model.layers.24.mlp.gate_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4440,input.49"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="5933" name="__module.model.layers.24.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="4441"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="5934" name="self.model.layers.24.mlp.up_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="4281923704" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5935" name="Convert_385307" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5936" name="self.model.layers.24.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="4317313144" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5937" name="Convert_385309" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5938" name="self.model.layers.24.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5939" name="self.model.layers.24.mlp.up_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="4317589624" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5940" name="self.model.layers.24.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5941" name="Constant_385314" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5942" name="Reshape_385315" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5943" name="__module.model.layers.24.mlp.up_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5944" name="__module.model.layers.24.mlp.up_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4443"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="5945" name="__module.model.layers.24.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4444"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="5946" name="self.model.layers.24.mlp.down_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 128" offset="4318695544" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5947" name="Convert_385327" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5948" name="self.model.layers.24.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 1" offset="4354084984" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5949" name="Convert_385329" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5950" name="self.model.layers.24.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5951" name="self.model.layers.24.mlp.down_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 108, 1" offset="4354361464" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5952" name="self.model.layers.24.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5953" name="Constant_385334" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="922101848" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5954" name="Reshape_385335" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="5955" name="__module.model.layers.24.mlp.down_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="5956" name="__module.model.layers.24.mlp.down_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4446,hidden_states.747"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5957" name="__module.model.layers.24/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4447,4449,4457,4468,hidden_states.749,hidden_states.751"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5958" name="Constant_290301" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="4355467384" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5959" name="Constant_290300" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5960" name="Constant_290298" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5961" name="__module.model.layers.25.input_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4458"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5962" name="Constant_17326" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="4459"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5963" name="__module.model.layers.25.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4460,variance.101"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5964" name="Constant_290299" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5965" name="__module.model.layers.25.input_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4461"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5966" name="__module.model.layers.25.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5967" name="__module.model.layers.25.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4462"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5968" name="__module.model.layers.25.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4463,4464,hidden_states.753,hidden_states.755"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5969" name="__module.model.layers.25.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4465,4467,hidden_states.757"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5970" name="self.model.layers.25.self_attn.q_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="4355487864" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5971" name="Convert_386527" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5972" name="self.model.layers.25.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="4368595064" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5973" name="Convert_386529" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5974" name="self.model.layers.25.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5975" name="self.model.layers.25.self_attn.q_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="4368697464" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5976" name="self.model.layers.25.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5977" name="Constant_386534" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="5978" name="Reshape_386535" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5979" name="__module.model.layers.25.self_attn.q_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5980" name="__module.model.layers.25.self_attn.q_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5981" name="self.model.layers.25.self_attn.q_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="5120" offset="4369107064" size="10240" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.25.self_attn.q_proj.bias"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5982" name="__module.model.layers.25.self_attn.q_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5983" name="__module.model.layers.25.self_attn.q_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4477,query_states.51"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="5984" name="Constant_301847" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="792694336" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5985" name="__module.model.layers.25.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4485"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5986" name="__module.model.layers.25.self_attn/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5987" name="__module.model.layers.25.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4486,q.51"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5988" name="__module.model.layers.25.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4495"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="5989" name="__module.model.layers.25.self_attn/aten::size/ShapeOf_3" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="5990" name="__module.model.layers.25.self_attn/aten::size/Constant_3" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="5991" name="__module.model.layers.25.self_attn/aten::size/Gather_3" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="4496,4501" /> + </output> + </layer> + <layer id="5992" name="__module.model.layers.25.self_attn/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="5993" name="__module.model.layers.25.self_attn/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="4498,4499,4503,4504" /> + </output> + </layer> + <layer id="5994" name="Constant_220920" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5995" name="__module.model.layers.25.self_attn/aten::slice/Reshape_5" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5996" name="__module.model.layers.25.self_attn/aten::slice/Reshape_1" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5997" name="__module.model.layers.25.self_attn/aten::slice/Reshape_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5998" name="__module.model.layers.25.self_attn/aten::slice/Reshape_3" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="5999" name="__module.model.layers.25.self_attn/aten::slice/Slice" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="4505,x2.101"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6000" name="Constant_290302" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6001" name="__module.model.layers.25.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4506"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6002" name="__module.model.layers.25.self_attn/aten::slice/Reshape_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6003" name="__module.model.layers.25.self_attn/aten::slice/Reshape_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6004" name="__module.model.layers.25.self_attn/aten::slice/Reshape_7" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6005" name="__module.model.layers.25.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="4500"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6006" name="__module.model.layers.25.self_attn/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4508"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6007" name="__module.model.layers.25.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4509"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6008" name="__module.model.layers.25.self_attn/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4510"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6009" name="Constant_341425" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="6010" name="Constant_341418" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6011" name="Constant_341420" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6012" name="Constant_341422" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6013" name="Concat_341423" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6014" name="Broadcast_341426" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6015" name="ReadValue_333148" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.25.keypresent.25.key" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.25.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6016" name="Constant_325459" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6017" name="Gather_325460" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6018" name="self.model.layers.25.self_attn.k_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="4369117304" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6019" name="Convert_387487" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6020" name="self.model.layers.25.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="4371738744" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6021" name="Convert_387489" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6022" name="self.model.layers.25.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6023" name="self.model.layers.25.self_attn.k_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="4371759224" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6024" name="self.model.layers.25.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6025" name="Constant_387494" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6026" name="Reshape_387495" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6027" name="__module.model.layers.25.self_attn.k_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6028" name="__module.model.layers.25.self_attn.k_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="6029" name="self.model.layers.25.self_attn.k_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="4371841144" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.25.self_attn.k_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="6030" name="__module.model.layers.25.self_attn.k_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="6031" name="__module.model.layers.25.self_attn.k_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4480,key_states.105"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="6032" name="Constant_301848" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6033" name="__module.model.layers.25.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4488"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6034" name="__module.model.layers.25.self_attn/aten::transpose/ScatterElementsUpdate_1" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6035" name="__module.model.layers.25.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4489,k.51"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6036" name="__module.model.layers.25.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4511"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6037" name="__module.model.layers.25.self_attn/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6038" name="__module.model.layers.25.self_attn/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="6039" name="__module.model.layers.25.self_attn/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="4512,4517" /> + </output> + </layer> + <layer id="6040" name="__module.model.layers.25.self_attn/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="6041" name="__module.model.layers.25.self_attn/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="4514,4515,4519,4520" /> + </output> + </layer> + <layer id="6042" name="Constant_220921" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6043" name="__module.model.layers.25.self_attn/aten::slice/Reshape_13" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6044" name="__module.model.layers.25.self_attn/aten::slice/Reshape_9" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6045" name="__module.model.layers.25.self_attn/aten::slice/Reshape_10" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6046" name="__module.model.layers.25.self_attn/aten::slice/Reshape_11" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6047" name="__module.model.layers.25.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="4521,x2.103"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6048" name="Constant_290303" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6049" name="__module.model.layers.25.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4522"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6050" name="__module.model.layers.25.self_attn/aten::slice/Reshape_12" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6051" name="__module.model.layers.25.self_attn/aten::slice/Reshape_14" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6052" name="__module.model.layers.25.self_attn/aten::slice/Reshape_15" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6053" name="__module.model.layers.25.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="4516"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6054" name="__module.model.layers.25.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4524"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6055" name="__module.model.layers.25.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4525"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6056" name="__module.model.layers.25.self_attn/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4526"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6057" name="__module.model.layers.25.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.25.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6058" name="__module.model.layers.25.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="4538,4539,4540"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6059" name="__module.model.layers.25.self_attn/aten::size/ShapeOf_6" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6060" name="Constant_302489" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="938477672" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6061" name="Constant_302490" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6062" name="Gather_302491" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6063" name="Constant_268734" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6064" name="Constant_277066" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6065" name="Constant_277067" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6066" name="Gather_277068" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6067" name="__module.model.layers.25.self_attn/prim::ListConstruct/Concat_2" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="3" precision="I64" names="4541"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="6068" name="__module.model.layers.25.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4542,hidden_states.761"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6069" name="Constant_301849" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6070" name="__module.model.layers.25.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4546,key_states.107"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6071" name="Constant_341438" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="6072" name="Constant_341431" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6073" name="Constant_341433" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6074" name="Constant_341435" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6075" name="Concat_341436" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6076" name="Broadcast_341439" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6077" name="ReadValue_333150" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.25.valuepresent.25.value" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.25.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6078" name="Constant_325462" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6079" name="Gather_325463" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6080" name="self.model.layers.25.self_attn.v_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="4371843192" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6081" name="Convert_387497" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6082" name="self.model.layers.25.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="4374464632" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6083" name="Convert_387499" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6084" name="self.model.layers.25.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6085" name="self.model.layers.25.self_attn.v_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="4374485112" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6086" name="self.model.layers.25.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6087" name="Constant_387504" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6088" name="Reshape_387505" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6089" name="__module.model.layers.25.self_attn.v_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6090" name="__module.model.layers.25.self_attn.v_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="6091" name="self.model.layers.25.self_attn.v_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="4374567032" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.25.self_attn.v_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="6092" name="__module.model.layers.25.self_attn.v_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="6093" name="__module.model.layers.25.self_attn.v_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4483,value_states.51"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="6094" name="Constant_301850" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6095" name="__module.model.layers.25.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4491"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6096" name="__module.model.layers.25.self_attn/aten::transpose/ScatterElementsUpdate_2" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6097" name="__module.model.layers.25.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4492"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6098" name="__module.model.layers.25.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.25.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6099" name="__module.model.layers.25.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="4554,4555,4556"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6100" name="__module.model.layers.25.self_attn/aten::size/ShapeOf_10" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6101" name="Constant_302235" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6102" name="__module.model.layers.25.self_attn/aten::size/Constant_11" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="6103" name="__module.model.layers.25.self_attn/aten::size/Gather_11" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="4548"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6104" name="Constant_268752" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6105" name="Constant_277076" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6106" name="Constant_277077" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6107" name="Gather_277078" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6108" name="__module.model.layers.25.self_attn/prim::ListConstruct/Concat_5" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="4557"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="6109" name="__module.model.layers.25.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4558,hidden_states.765"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6110" name="Constant_301851" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6111" name="__module.model.layers.25.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4562"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6112" name="__module.model.layers.25.self_attn/aten::slice/Reshape_60" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6113" name="ShapeOf_299730" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6114" name="Constant_299731" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6115" name="Constant_299732" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6116" name="Gather_299733" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6117" name="ShapeOf_299734" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6118" name="Constant_299735" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6119" name="Constant_299736" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6120" name="Gather_299737" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6121" name="Add_299738" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="4563"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6122" name="__module.model.layers.25.self_attn/aten::slice/Reshape_62" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6123" name="__module.model.layers.25.self_attn/aten::slice/Reshape_63" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6124" name="__module.model.layers.25.self_attn/aten::slice/Slice_15" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="4567"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="6125" name="__module.model.layers.25.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4568,attn_output.101"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6126" name="__module.model.layers.25.self_attn/aten::transpose/ScatterElementsUpdate_3" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6127" name="__module.model.layers.25.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4569"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6128" name="Constant_301852" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="798146608" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="6129" name="__module.model.layers.25.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4572"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6130" name="self.model.layers.25.self_attn.o_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="4374569080" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6131" name="Convert_386537" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6132" name="self.model.layers.25.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="4387676280" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6133" name="Convert_386539" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6134" name="self.model.layers.25.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6135" name="self.model.layers.25.self_attn.o_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="4387778680" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6136" name="self.model.layers.25.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6137" name="Constant_386544" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6138" name="Reshape_386545" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6139" name="__module.model.layers.25.self_attn.o_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6140" name="__module.model.layers.25.self_attn.o_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4574,4576,hidden_states.767"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6141" name="__module.model.layers.25/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4579,4581,4592,hidden_states.769,hidden_states.771"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6142" name="Constant_290307" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="4388188280" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6143" name="Constant_290306" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6144" name="Constant_290304" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6145" name="__module.model.layers.25.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4582"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6146" name="Constant_17924" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="4583"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6147" name="__module.model.layers.25.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4584,variance.103"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6148" name="Constant_290305" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6149" name="__module.model.layers.25.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4585"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6150" name="__module.model.layers.25.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6151" name="__module.model.layers.25.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4586"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6152" name="__module.model.layers.25.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4587,4588,hidden_states.773,hidden_states.775"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6153" name="__module.model.layers.25.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4589,4591"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6154" name="self.model.layers.25.mlp.gate_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="4388208760" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6155" name="Convert_385347" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6156" name="self.model.layers.25.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="4423598200" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6157" name="Convert_385349" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6158" name="self.model.layers.25.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6159" name="self.model.layers.25.mlp.gate_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="4423874680" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6160" name="self.model.layers.25.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6161" name="Constant_385354" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6162" name="Reshape_385355" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6163" name="__module.model.layers.25.mlp.gate_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6164" name="__module.model.layers.25.mlp.gate_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4597,input.51"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="6165" name="__module.model.layers.25.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="4598"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="6166" name="self.model.layers.25.mlp.up_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="4424980600" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6167" name="Convert_385337" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6168" name="self.model.layers.25.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="4460370040" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6169" name="Convert_385339" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6170" name="self.model.layers.25.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6171" name="self.model.layers.25.mlp.up_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="4460646520" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6172" name="self.model.layers.25.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6173" name="Constant_385344" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6174" name="Reshape_385345" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6175" name="__module.model.layers.25.mlp.up_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6176" name="__module.model.layers.25.mlp.up_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4600"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="6177" name="__module.model.layers.25.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4601"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="6178" name="self.model.layers.25.mlp.down_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 128" offset="4461752440" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6179" name="Convert_385357" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6180" name="self.model.layers.25.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 1" offset="4497141880" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6181" name="Convert_385359" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6182" name="self.model.layers.25.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6183" name="self.model.layers.25.mlp.down_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 108, 1" offset="4497418360" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6184" name="self.model.layers.25.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6185" name="Constant_385364" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="922101848" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6186" name="Reshape_385365" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="6187" name="__module.model.layers.25.mlp.down_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="6188" name="__module.model.layers.25.mlp.down_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4603,hidden_states.777"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6189" name="__module.model.layers.25/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4604,4606,4614,4625,hidden_states.779,hidden_states.781"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6190" name="Constant_290311" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="4498524280" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6191" name="Constant_290310" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6192" name="Constant_290308" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6193" name="__module.model.layers.26.input_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4615"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6194" name="Constant_17998" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="4616"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6195" name="__module.model.layers.26.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4617,variance.105"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6196" name="Constant_290309" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6197" name="__module.model.layers.26.input_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4618"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6198" name="__module.model.layers.26.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6199" name="__module.model.layers.26.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4619"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6200" name="__module.model.layers.26.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4620,4621,hidden_states.783,hidden_states.785"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6201" name="__module.model.layers.26.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4622,4624,hidden_states.787"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6202" name="self.model.layers.26.self_attn.q_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="4498544760" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6203" name="Convert_386547" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6204" name="self.model.layers.26.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="4511651960" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6205" name="Convert_386549" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6206" name="self.model.layers.26.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6207" name="self.model.layers.26.self_attn.q_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="4511754360" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6208" name="self.model.layers.26.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6209" name="Constant_386554" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6210" name="Reshape_386555" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6211" name="__module.model.layers.26.self_attn.q_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6212" name="__module.model.layers.26.self_attn.q_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6213" name="self.model.layers.26.self_attn.q_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="5120" offset="4512163960" size="10240" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.26.self_attn.q_proj.bias"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6214" name="__module.model.layers.26.self_attn.q_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6215" name="__module.model.layers.26.self_attn.q_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4634,query_states.53"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6216" name="Constant_301853" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="792694336" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6217" name="__module.model.layers.26.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4642"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6218" name="__module.model.layers.26.self_attn/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6219" name="__module.model.layers.26.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4643,q.53"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6220" name="__module.model.layers.26.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4652"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6221" name="__module.model.layers.26.self_attn/aten::size/ShapeOf_3" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6222" name="__module.model.layers.26.self_attn/aten::size/Constant_3" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="6223" name="__module.model.layers.26.self_attn/aten::size/Gather_3" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="4653,4658" /> + </output> + </layer> + <layer id="6224" name="__module.model.layers.26.self_attn/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="6225" name="__module.model.layers.26.self_attn/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="4655,4656,4660,4661" /> + </output> + </layer> + <layer id="6226" name="Constant_220935" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6227" name="__module.model.layers.26.self_attn/aten::slice/Reshape_5" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6228" name="__module.model.layers.26.self_attn/aten::slice/Reshape_1" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6229" name="__module.model.layers.26.self_attn/aten::slice/Reshape_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6230" name="__module.model.layers.26.self_attn/aten::slice/Reshape_3" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6231" name="__module.model.layers.26.self_attn/aten::slice/Slice" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="4662,x2.105"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6232" name="Constant_290312" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6233" name="__module.model.layers.26.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4663"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6234" name="__module.model.layers.26.self_attn/aten::slice/Reshape_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6235" name="__module.model.layers.26.self_attn/aten::slice/Reshape_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6236" name="__module.model.layers.26.self_attn/aten::slice/Reshape_7" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6237" name="__module.model.layers.26.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="4657"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6238" name="__module.model.layers.26.self_attn/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4665"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6239" name="__module.model.layers.26.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4666"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6240" name="__module.model.layers.26.self_attn/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4667"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6241" name="Constant_341451" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="6242" name="Constant_341444" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6243" name="Constant_341446" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6244" name="Constant_341448" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6245" name="Concat_341449" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6246" name="Broadcast_341452" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6247" name="ReadValue_333152" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.26.keypresent.26.key" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.26.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6248" name="Constant_325465" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6249" name="Gather_325466" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6250" name="self.model.layers.26.self_attn.k_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="4512174200" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6251" name="Convert_387507" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6252" name="self.model.layers.26.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="4514795640" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6253" name="Convert_387509" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6254" name="self.model.layers.26.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6255" name="self.model.layers.26.self_attn.k_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="4514816120" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6256" name="self.model.layers.26.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6257" name="Constant_387514" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6258" name="Reshape_387515" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6259" name="__module.model.layers.26.self_attn.k_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6260" name="__module.model.layers.26.self_attn.k_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="6261" name="self.model.layers.26.self_attn.k_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="4514898040" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.26.self_attn.k_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="6262" name="__module.model.layers.26.self_attn.k_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="6263" name="__module.model.layers.26.self_attn.k_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4637,key_states.109"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="6264" name="Constant_301854" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6265" name="__module.model.layers.26.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4645"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6266" name="__module.model.layers.26.self_attn/aten::transpose/ScatterElementsUpdate_1" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6267" name="__module.model.layers.26.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4646,k.53"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6268" name="__module.model.layers.26.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4668"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6269" name="__module.model.layers.26.self_attn/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6270" name="__module.model.layers.26.self_attn/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="6271" name="__module.model.layers.26.self_attn/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="4669,4674" /> + </output> + </layer> + <layer id="6272" name="__module.model.layers.26.self_attn/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="6273" name="__module.model.layers.26.self_attn/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="4671,4672,4676,4677" /> + </output> + </layer> + <layer id="6274" name="Constant_220936" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6275" name="__module.model.layers.26.self_attn/aten::slice/Reshape_13" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6276" name="__module.model.layers.26.self_attn/aten::slice/Reshape_9" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6277" name="__module.model.layers.26.self_attn/aten::slice/Reshape_10" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6278" name="__module.model.layers.26.self_attn/aten::slice/Reshape_11" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6279" name="__module.model.layers.26.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="4678,x2.107"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6280" name="Constant_290313" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6281" name="__module.model.layers.26.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4679"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6282" name="__module.model.layers.26.self_attn/aten::slice/Reshape_12" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6283" name="__module.model.layers.26.self_attn/aten::slice/Reshape_14" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6284" name="__module.model.layers.26.self_attn/aten::slice/Reshape_15" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6285" name="__module.model.layers.26.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="4673"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6286" name="__module.model.layers.26.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4681"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6287" name="__module.model.layers.26.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4682"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6288" name="__module.model.layers.26.self_attn/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4683"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6289" name="__module.model.layers.26.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.26.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6290" name="__module.model.layers.26.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="4695,4696,4697"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6291" name="__module.model.layers.26.self_attn/aten::size/ShapeOf_6" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6292" name="Constant_302494" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="938477672" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6293" name="Constant_302495" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6294" name="Gather_302496" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6295" name="Constant_268770" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6296" name="Constant_277101" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6297" name="Constant_277102" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6298" name="Gather_277103" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6299" name="__module.model.layers.26.self_attn/prim::ListConstruct/Concat_2" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="3" precision="I64" names="4698"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="6300" name="__module.model.layers.26.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4699,hidden_states.791"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6301" name="Constant_301855" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6302" name="__module.model.layers.26.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4703,key_states.111"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6303" name="Constant_341464" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="6304" name="Constant_341457" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6305" name="Constant_341459" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6306" name="Constant_341461" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6307" name="Concat_341462" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6308" name="Broadcast_341465" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6309" name="ReadValue_333154" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.26.valuepresent.26.value" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.26.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6310" name="Constant_325468" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6311" name="Gather_325469" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6312" name="self.model.layers.26.self_attn.v_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="4514900088" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6313" name="Convert_387517" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6314" name="self.model.layers.26.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="4517521528" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6315" name="Convert_387519" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6316" name="self.model.layers.26.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6317" name="self.model.layers.26.self_attn.v_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="4517542008" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6318" name="self.model.layers.26.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6319" name="Constant_387524" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6320" name="Reshape_387525" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6321" name="__module.model.layers.26.self_attn.v_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6322" name="__module.model.layers.26.self_attn.v_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="6323" name="self.model.layers.26.self_attn.v_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="4517623928" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.26.self_attn.v_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="6324" name="__module.model.layers.26.self_attn.v_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="6325" name="__module.model.layers.26.self_attn.v_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4640,value_states.53"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="6326" name="Constant_301856" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6327" name="__module.model.layers.26.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4648"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6328" name="__module.model.layers.26.self_attn/aten::transpose/ScatterElementsUpdate_2" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6329" name="__module.model.layers.26.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4649"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6330" name="__module.model.layers.26.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.26.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6331" name="__module.model.layers.26.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="4711,4712,4713"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6332" name="__module.model.layers.26.self_attn/aten::size/ShapeOf_10" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6333" name="Constant_302241" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6334" name="__module.model.layers.26.self_attn/aten::size/Constant_11" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="6335" name="__module.model.layers.26.self_attn/aten::size/Gather_11" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="4705"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6336" name="Constant_268788" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6337" name="Constant_277111" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6338" name="Constant_277112" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6339" name="Gather_277113" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6340" name="__module.model.layers.26.self_attn/prim::ListConstruct/Concat_5" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="4714"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="6341" name="__module.model.layers.26.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4715,hidden_states.795"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6342" name="Constant_301857" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6343" name="__module.model.layers.26.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4719"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6344" name="__module.model.layers.26.self_attn/aten::slice/Reshape_60" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6345" name="ShapeOf_299816" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6346" name="Constant_299817" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6347" name="Constant_299818" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6348" name="Gather_299819" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6349" name="ShapeOf_299820" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6350" name="Constant_299821" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6351" name="Constant_299822" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6352" name="Gather_299823" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6353" name="Add_299824" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="4720"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6354" name="__module.model.layers.26.self_attn/aten::slice/Reshape_62" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6355" name="__module.model.layers.26.self_attn/aten::slice/Reshape_63" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6356" name="__module.model.layers.26.self_attn/aten::slice/Slice_15" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="4724"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="6357" name="__module.model.layers.26.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4725,attn_output.105"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6358" name="__module.model.layers.26.self_attn/aten::transpose/ScatterElementsUpdate_3" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6359" name="__module.model.layers.26.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4726"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6360" name="Constant_301858" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="798146608" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="6361" name="__module.model.layers.26.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4729"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6362" name="self.model.layers.26.self_attn.o_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="4517625976" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6363" name="Convert_386557" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6364" name="self.model.layers.26.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="4530733176" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6365" name="Convert_386559" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6366" name="self.model.layers.26.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6367" name="self.model.layers.26.self_attn.o_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="4530835576" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6368" name="self.model.layers.26.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6369" name="Constant_386564" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6370" name="Reshape_386565" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6371" name="__module.model.layers.26.self_attn.o_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6372" name="__module.model.layers.26.self_attn.o_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4731,4733,hidden_states.797"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6373" name="__module.model.layers.26/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4736,4738,4749,hidden_states.799,hidden_states.801"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6374" name="Constant_290317" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="4531245176" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6375" name="Constant_290316" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6376" name="Constant_290314" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6377" name="__module.model.layers.26.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4739"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6378" name="Constant_18596" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="4740"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6379" name="__module.model.layers.26.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4741,variance.107"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6380" name="Constant_290315" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6381" name="__module.model.layers.26.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4742"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6382" name="__module.model.layers.26.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6383" name="__module.model.layers.26.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4743"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6384" name="__module.model.layers.26.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4744,4745,hidden_states.803,hidden_states.805"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6385" name="__module.model.layers.26.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4746,4748"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6386" name="self.model.layers.26.mlp.gate_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="4531265656" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6387" name="Convert_385377" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6388" name="self.model.layers.26.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="4566655096" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6389" name="Convert_385379" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6390" name="self.model.layers.26.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6391" name="self.model.layers.26.mlp.gate_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="4566931576" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6392" name="self.model.layers.26.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6393" name="Constant_385384" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6394" name="Reshape_385385" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6395" name="__module.model.layers.26.mlp.gate_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6396" name="__module.model.layers.26.mlp.gate_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4754,input.53"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="6397" name="__module.model.layers.26.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="4755"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="6398" name="self.model.layers.26.mlp.up_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="4568037496" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6399" name="Convert_385367" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6400" name="self.model.layers.26.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="4603426936" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6401" name="Convert_385369" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6402" name="self.model.layers.26.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6403" name="self.model.layers.26.mlp.up_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="4603703416" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6404" name="self.model.layers.26.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6405" name="Constant_385374" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6406" name="Reshape_385375" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6407" name="__module.model.layers.26.mlp.up_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6408" name="__module.model.layers.26.mlp.up_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4757"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="6409" name="__module.model.layers.26.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4758"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="6410" name="self.model.layers.26.mlp.down_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 128" offset="4604809336" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6411" name="Convert_385387" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6412" name="self.model.layers.26.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 1" offset="4640198776" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6413" name="Convert_385389" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6414" name="self.model.layers.26.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6415" name="self.model.layers.26.mlp.down_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 108, 1" offset="4640475256" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6416" name="self.model.layers.26.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6417" name="Constant_385394" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="922101848" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6418" name="Reshape_385395" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="6419" name="__module.model.layers.26.mlp.down_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="6420" name="__module.model.layers.26.mlp.down_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4760,hidden_states.807"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6421" name="__module.model.layers.26/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4761,4763,4771,4782,hidden_states.809,hidden_states.811"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6422" name="Constant_290321" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="4641581176" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6423" name="Constant_290320" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6424" name="Constant_290318" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6425" name="__module.model.layers.27.input_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4772"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6426" name="Constant_18670" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="4773"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6427" name="__module.model.layers.27.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4774,variance.109"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6428" name="Constant_290319" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6429" name="__module.model.layers.27.input_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4775"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6430" name="__module.model.layers.27.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6431" name="__module.model.layers.27.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4776"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6432" name="__module.model.layers.27.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4777,4778,hidden_states.813,hidden_states.815"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6433" name="__module.model.layers.27.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4779,4781,hidden_states.817"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6434" name="self.model.layers.27.self_attn.q_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="4641601656" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6435" name="Convert_386567" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6436" name="self.model.layers.27.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="4654708856" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6437" name="Convert_386569" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6438" name="self.model.layers.27.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6439" name="self.model.layers.27.self_attn.q_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="4654811256" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6440" name="self.model.layers.27.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6441" name="Constant_386574" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6442" name="Reshape_386575" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6443" name="__module.model.layers.27.self_attn.q_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6444" name="__module.model.layers.27.self_attn.q_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6445" name="self.model.layers.27.self_attn.q_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="5120" offset="4655220856" size="10240" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.27.self_attn.q_proj.bias"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6446" name="__module.model.layers.27.self_attn.q_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6447" name="__module.model.layers.27.self_attn.q_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4791,query_states.55"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6448" name="Constant_301859" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="792694336" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6449" name="__module.model.layers.27.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4799"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6450" name="__module.model.layers.27.self_attn/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6451" name="__module.model.layers.27.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4800,q.55"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6452" name="__module.model.layers.27.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4809"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6453" name="__module.model.layers.27.self_attn/aten::size/ShapeOf_3" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6454" name="__module.model.layers.27.self_attn/aten::size/Constant_3" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="6455" name="__module.model.layers.27.self_attn/aten::size/Gather_3" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="4810,4815" /> + </output> + </layer> + <layer id="6456" name="__module.model.layers.27.self_attn/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="6457" name="__module.model.layers.27.self_attn/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="4812,4813,4817,4818" /> + </output> + </layer> + <layer id="6458" name="Constant_220950" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6459" name="__module.model.layers.27.self_attn/aten::slice/Reshape_5" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6460" name="__module.model.layers.27.self_attn/aten::slice/Reshape_1" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6461" name="__module.model.layers.27.self_attn/aten::slice/Reshape_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6462" name="__module.model.layers.27.self_attn/aten::slice/Reshape_3" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6463" name="__module.model.layers.27.self_attn/aten::slice/Slice" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="4819,x2.109"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6464" name="Constant_290322" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6465" name="__module.model.layers.27.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4820"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6466" name="__module.model.layers.27.self_attn/aten::slice/Reshape_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6467" name="__module.model.layers.27.self_attn/aten::slice/Reshape_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6468" name="__module.model.layers.27.self_attn/aten::slice/Reshape_7" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6469" name="__module.model.layers.27.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="4814"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6470" name="__module.model.layers.27.self_attn/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4822"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6471" name="__module.model.layers.27.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4823"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6472" name="__module.model.layers.27.self_attn/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4824"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6473" name="Constant_341477" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="6474" name="Constant_341470" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6475" name="Constant_341472" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6476" name="Constant_341474" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6477" name="Concat_341475" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6478" name="Broadcast_341478" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6479" name="ReadValue_333156" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.27.keypresent.27.key" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.27.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6480" name="Constant_325471" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6481" name="Gather_325472" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6482" name="self.model.layers.27.self_attn.k_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="4655231096" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6483" name="Convert_387527" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6484" name="self.model.layers.27.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="4657852536" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6485" name="Convert_387529" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6486" name="self.model.layers.27.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6487" name="self.model.layers.27.self_attn.k_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="4657873016" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6488" name="self.model.layers.27.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6489" name="Constant_387534" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6490" name="Reshape_387535" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6491" name="__module.model.layers.27.self_attn.k_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6492" name="__module.model.layers.27.self_attn.k_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="6493" name="self.model.layers.27.self_attn.k_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="4657954936" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.27.self_attn.k_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="6494" name="__module.model.layers.27.self_attn.k_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="6495" name="__module.model.layers.27.self_attn.k_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4794,key_states.113"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="6496" name="Constant_301860" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6497" name="__module.model.layers.27.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4802"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6498" name="__module.model.layers.27.self_attn/aten::transpose/ScatterElementsUpdate_1" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6499" name="__module.model.layers.27.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4803,k.55"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6500" name="__module.model.layers.27.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4825"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6501" name="__module.model.layers.27.self_attn/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6502" name="__module.model.layers.27.self_attn/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="6503" name="__module.model.layers.27.self_attn/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="4826,4831" /> + </output> + </layer> + <layer id="6504" name="__module.model.layers.27.self_attn/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="6505" name="__module.model.layers.27.self_attn/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="4828,4829,4833,4834" /> + </output> + </layer> + <layer id="6506" name="Constant_220951" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6507" name="__module.model.layers.27.self_attn/aten::slice/Reshape_13" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6508" name="__module.model.layers.27.self_attn/aten::slice/Reshape_9" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6509" name="__module.model.layers.27.self_attn/aten::slice/Reshape_10" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6510" name="__module.model.layers.27.self_attn/aten::slice/Reshape_11" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6511" name="__module.model.layers.27.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="4835,x2.111"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6512" name="Constant_290323" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6513" name="__module.model.layers.27.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4836"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6514" name="__module.model.layers.27.self_attn/aten::slice/Reshape_12" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6515" name="__module.model.layers.27.self_attn/aten::slice/Reshape_14" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6516" name="__module.model.layers.27.self_attn/aten::slice/Reshape_15" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6517" name="__module.model.layers.27.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="4830"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6518" name="__module.model.layers.27.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4838"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6519" name="__module.model.layers.27.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4839"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6520" name="__module.model.layers.27.self_attn/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4840"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6521" name="__module.model.layers.27.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.27.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6522" name="__module.model.layers.27.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="4852,4853,4854"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6523" name="__module.model.layers.27.self_attn/aten::size/ShapeOf_6" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6524" name="Constant_302499" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="938477672" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6525" name="Constant_302500" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6526" name="Gather_302501" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6527" name="Constant_268806" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6528" name="Constant_277136" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6529" name="Constant_277137" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6530" name="Gather_277138" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6531" name="__module.model.layers.27.self_attn/prim::ListConstruct/Concat_2" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="3" precision="I64" names="4855"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="6532" name="__module.model.layers.27.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4856,hidden_states.821"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6533" name="Constant_301861" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6534" name="__module.model.layers.27.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4860,key_states.115"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6535" name="Constant_341490" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="6536" name="Constant_341483" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6537" name="Constant_341485" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6538" name="Constant_341487" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6539" name="Concat_341488" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6540" name="Broadcast_341491" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6541" name="ReadValue_333158" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.27.valuepresent.27.value" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.27.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6542" name="Constant_325474" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6543" name="Gather_325475" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6544" name="self.model.layers.27.self_attn.v_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="4657956984" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6545" name="Convert_387537" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6546" name="self.model.layers.27.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="4660578424" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6547" name="Convert_387539" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6548" name="self.model.layers.27.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6549" name="self.model.layers.27.self_attn.v_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="4660598904" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6550" name="self.model.layers.27.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6551" name="Constant_387544" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6552" name="Reshape_387545" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6553" name="__module.model.layers.27.self_attn.v_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6554" name="__module.model.layers.27.self_attn.v_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="6555" name="self.model.layers.27.self_attn.v_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="4660680824" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.27.self_attn.v_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="6556" name="__module.model.layers.27.self_attn.v_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="6557" name="__module.model.layers.27.self_attn.v_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4797,value_states.55"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="6558" name="Constant_301862" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6559" name="__module.model.layers.27.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4805"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6560" name="__module.model.layers.27.self_attn/aten::transpose/ScatterElementsUpdate_2" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6561" name="__module.model.layers.27.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4806"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6562" name="__module.model.layers.27.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.27.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6563" name="__module.model.layers.27.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="4868,4869,4870"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6564" name="__module.model.layers.27.self_attn/aten::size/ShapeOf_10" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6565" name="Constant_302247" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6566" name="__module.model.layers.27.self_attn/aten::size/Constant_11" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="6567" name="__module.model.layers.27.self_attn/aten::size/Gather_11" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="4862"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6568" name="Constant_268824" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6569" name="Constant_277146" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6570" name="Constant_277147" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6571" name="Gather_277148" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6572" name="__module.model.layers.27.self_attn/prim::ListConstruct/Concat_5" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="4871"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="6573" name="__module.model.layers.27.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4872,hidden_states.825"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6574" name="Constant_301863" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6575" name="__module.model.layers.27.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4876"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6576" name="__module.model.layers.27.self_attn/aten::slice/Reshape_60" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6577" name="ShapeOf_299902" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6578" name="Constant_299903" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6579" name="Constant_299904" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6580" name="Gather_299905" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6581" name="ShapeOf_299906" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6582" name="Constant_299907" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6583" name="Constant_299908" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6584" name="Gather_299909" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6585" name="Add_299910" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="4877"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6586" name="__module.model.layers.27.self_attn/aten::slice/Reshape_62" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6587" name="__module.model.layers.27.self_attn/aten::slice/Reshape_63" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6588" name="__module.model.layers.27.self_attn/aten::slice/Slice_15" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="4881"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="6589" name="__module.model.layers.27.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="4882,attn_output.109"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6590" name="__module.model.layers.27.self_attn/aten::transpose/ScatterElementsUpdate_3" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6591" name="__module.model.layers.27.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4883"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6592" name="Constant_301864" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="798146608" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="6593" name="__module.model.layers.27.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4886"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6594" name="self.model.layers.27.self_attn.o_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="4660682872" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6595" name="Convert_386577" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6596" name="self.model.layers.27.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="4673790072" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6597" name="Convert_386579" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6598" name="self.model.layers.27.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6599" name="self.model.layers.27.self_attn.o_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="4673892472" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6600" name="self.model.layers.27.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6601" name="Constant_386584" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6602" name="Reshape_386585" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6603" name="__module.model.layers.27.self_attn.o_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6604" name="__module.model.layers.27.self_attn.o_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4888,4890,hidden_states.827"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6605" name="__module.model.layers.27/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4893,4895,4906,hidden_states.829,hidden_states.831"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6606" name="Constant_290327" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="4674302072" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6607" name="Constant_290326" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6608" name="Constant_290324" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6609" name="__module.model.layers.27.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4896"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6610" name="Constant_19268" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="4897"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6611" name="__module.model.layers.27.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4898,variance.111"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6612" name="Constant_290325" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6613" name="__module.model.layers.27.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4899"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6614" name="__module.model.layers.27.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6615" name="__module.model.layers.27.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4900"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6616" name="__module.model.layers.27.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4901,4902,hidden_states.833,hidden_states.835"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6617" name="__module.model.layers.27.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4903,4905"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6618" name="self.model.layers.27.mlp.gate_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="4674322552" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6619" name="Convert_385407" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6620" name="self.model.layers.27.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="4709711992" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6621" name="Convert_385409" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6622" name="self.model.layers.27.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6623" name="self.model.layers.27.mlp.gate_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="4709988472" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6624" name="self.model.layers.27.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6625" name="Constant_385414" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6626" name="Reshape_385415" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6627" name="__module.model.layers.27.mlp.gate_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6628" name="__module.model.layers.27.mlp.gate_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4911,input.55"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="6629" name="__module.model.layers.27.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="4912"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="6630" name="self.model.layers.27.mlp.up_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="4711094392" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6631" name="Convert_385397" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6632" name="self.model.layers.27.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="4746483832" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6633" name="Convert_385399" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6634" name="self.model.layers.27.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6635" name="self.model.layers.27.mlp.up_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="4746760312" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6636" name="self.model.layers.27.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6637" name="Constant_385404" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6638" name="Reshape_385405" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6639" name="__module.model.layers.27.mlp.up_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6640" name="__module.model.layers.27.mlp.up_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4914"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="6641" name="__module.model.layers.27.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4915"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="6642" name="self.model.layers.27.mlp.down_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 128" offset="4747866232" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6643" name="Convert_385417" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6644" name="self.model.layers.27.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 1" offset="4783255672" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6645" name="Convert_385419" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6646" name="self.model.layers.27.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6647" name="self.model.layers.27.mlp.down_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 108, 1" offset="4783532152" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6648" name="self.model.layers.27.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6649" name="Constant_385424" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="922101848" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6650" name="Reshape_385425" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="6651" name="__module.model.layers.27.mlp.down_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="6652" name="__module.model.layers.27.mlp.down_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4917,hidden_states.837"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6653" name="__module.model.layers.27/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4918,4920,4928,4939,hidden_states.839,hidden_states.841"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6654" name="Constant_290331" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="4784638072" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6655" name="Constant_290330" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6656" name="Constant_290328" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6657" name="__module.model.layers.28.input_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4929"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6658" name="Constant_19342" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="4930"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6659" name="__module.model.layers.28.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4931,variance.113"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6660" name="Constant_290329" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6661" name="__module.model.layers.28.input_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4932"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6662" name="__module.model.layers.28.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6663" name="__module.model.layers.28.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4933"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6664" name="__module.model.layers.28.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4934,4935,hidden_states.843,hidden_states.845"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6665" name="__module.model.layers.28.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4936,4938,hidden_states.847"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6666" name="self.model.layers.28.self_attn.q_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="4784658552" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6667" name="Convert_386587" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6668" name="self.model.layers.28.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="4797765752" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6669" name="Convert_386589" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6670" name="self.model.layers.28.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6671" name="self.model.layers.28.self_attn.q_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="4797868152" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6672" name="self.model.layers.28.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6673" name="Constant_386594" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6674" name="Reshape_386595" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6675" name="__module.model.layers.28.self_attn.q_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6676" name="__module.model.layers.28.self_attn.q_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6677" name="self.model.layers.28.self_attn.q_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="5120" offset="4798277752" size="10240" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.28.self_attn.q_proj.bias"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6678" name="__module.model.layers.28.self_attn.q_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6679" name="__module.model.layers.28.self_attn.q_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4948,query_states.57"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6680" name="Constant_301865" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="792694336" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6681" name="__module.model.layers.28.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4956"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6682" name="__module.model.layers.28.self_attn/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6683" name="__module.model.layers.28.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4957,q.57"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6684" name="__module.model.layers.28.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4966"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6685" name="__module.model.layers.28.self_attn/aten::size/ShapeOf_3" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6686" name="__module.model.layers.28.self_attn/aten::size/Constant_3" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="6687" name="__module.model.layers.28.self_attn/aten::size/Gather_3" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="4967,4972" /> + </output> + </layer> + <layer id="6688" name="__module.model.layers.28.self_attn/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="6689" name="__module.model.layers.28.self_attn/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="4969,4970,4974,4975" /> + </output> + </layer> + <layer id="6690" name="Constant_220965" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6691" name="__module.model.layers.28.self_attn/aten::slice/Reshape_5" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6692" name="__module.model.layers.28.self_attn/aten::slice/Reshape_1" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6693" name="__module.model.layers.28.self_attn/aten::slice/Reshape_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6694" name="__module.model.layers.28.self_attn/aten::slice/Reshape_3" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6695" name="__module.model.layers.28.self_attn/aten::slice/Slice" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="4976,x2.113"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6696" name="Constant_290332" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6697" name="__module.model.layers.28.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4977"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6698" name="__module.model.layers.28.self_attn/aten::slice/Reshape_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6699" name="__module.model.layers.28.self_attn/aten::slice/Reshape_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6700" name="__module.model.layers.28.self_attn/aten::slice/Reshape_7" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6701" name="__module.model.layers.28.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="4971"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6702" name="__module.model.layers.28.self_attn/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4979"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6703" name="__module.model.layers.28.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4980"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6704" name="__module.model.layers.28.self_attn/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4981"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6705" name="Constant_341503" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="6706" name="Constant_341496" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6707" name="Constant_341498" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6708" name="Constant_341500" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6709" name="Concat_341501" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6710" name="Broadcast_341504" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6711" name="ReadValue_333160" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.28.keypresent.28.key" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.28.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6712" name="Constant_325477" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6713" name="Gather_325478" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6714" name="self.model.layers.28.self_attn.k_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="4798287992" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6715" name="Convert_387547" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6716" name="self.model.layers.28.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="4800909432" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6717" name="Convert_387549" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6718" name="self.model.layers.28.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6719" name="self.model.layers.28.self_attn.k_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="4800929912" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6720" name="self.model.layers.28.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6721" name="Constant_387554" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6722" name="Reshape_387555" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6723" name="__module.model.layers.28.self_attn.k_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6724" name="__module.model.layers.28.self_attn.k_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="6725" name="self.model.layers.28.self_attn.k_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="4801011832" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.28.self_attn.k_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="6726" name="__module.model.layers.28.self_attn.k_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="6727" name="__module.model.layers.28.self_attn.k_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4951,key_states.117"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="6728" name="Constant_301866" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6729" name="__module.model.layers.28.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4959"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6730" name="__module.model.layers.28.self_attn/aten::transpose/ScatterElementsUpdate_1" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6731" name="__module.model.layers.28.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4960,k.57"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6732" name="__module.model.layers.28.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4982"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6733" name="__module.model.layers.28.self_attn/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6734" name="__module.model.layers.28.self_attn/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="6735" name="__module.model.layers.28.self_attn/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="4983,4988" /> + </output> + </layer> + <layer id="6736" name="__module.model.layers.28.self_attn/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="6737" name="__module.model.layers.28.self_attn/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="4985,4986,4990,4991" /> + </output> + </layer> + <layer id="6738" name="Constant_220966" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6739" name="__module.model.layers.28.self_attn/aten::slice/Reshape_13" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6740" name="__module.model.layers.28.self_attn/aten::slice/Reshape_9" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6741" name="__module.model.layers.28.self_attn/aten::slice/Reshape_10" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6742" name="__module.model.layers.28.self_attn/aten::slice/Reshape_11" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6743" name="__module.model.layers.28.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="4992,x2.115"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6744" name="Constant_290333" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6745" name="__module.model.layers.28.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4993"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6746" name="__module.model.layers.28.self_attn/aten::slice/Reshape_12" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6747" name="__module.model.layers.28.self_attn/aten::slice/Reshape_14" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6748" name="__module.model.layers.28.self_attn/aten::slice/Reshape_15" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6749" name="__module.model.layers.28.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="4987"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6750" name="__module.model.layers.28.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4995"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6751" name="__module.model.layers.28.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4996"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6752" name="__module.model.layers.28.self_attn/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4997"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6753" name="__module.model.layers.28.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.28.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6754" name="__module.model.layers.28.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="5009,5010,5011"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6755" name="__module.model.layers.28.self_attn/aten::size/ShapeOf_6" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6756" name="Constant_302504" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="938477672" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6757" name="Constant_302505" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6758" name="Gather_302506" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6759" name="Constant_268842" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6760" name="Constant_277171" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6761" name="Constant_277172" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6762" name="Gather_277173" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6763" name="__module.model.layers.28.self_attn/prim::ListConstruct/Concat_2" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="3" precision="I64" names="5012"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="6764" name="__module.model.layers.28.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5013,hidden_states.851"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6765" name="Constant_301867" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6766" name="__module.model.layers.28.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5017,key_states.119"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6767" name="Constant_341516" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="6768" name="Constant_341509" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6769" name="Constant_341511" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6770" name="Constant_341513" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6771" name="Concat_341514" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6772" name="Broadcast_341517" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6773" name="ReadValue_333162" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.28.valuepresent.28.value" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.28.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6774" name="Constant_325480" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6775" name="Gather_325481" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6776" name="self.model.layers.28.self_attn.v_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="4801013880" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6777" name="Convert_387557" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6778" name="self.model.layers.28.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="4803635320" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6779" name="Convert_387559" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6780" name="self.model.layers.28.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6781" name="self.model.layers.28.self_attn.v_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="4803655800" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6782" name="self.model.layers.28.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6783" name="Constant_387564" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6784" name="Reshape_387565" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6785" name="__module.model.layers.28.self_attn.v_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6786" name="__module.model.layers.28.self_attn.v_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="6787" name="self.model.layers.28.self_attn.v_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="4803737720" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.28.self_attn.v_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="6788" name="__module.model.layers.28.self_attn.v_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="6789" name="__module.model.layers.28.self_attn.v_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4954,value_states.57"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="6790" name="Constant_301868" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6791" name="__module.model.layers.28.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4962"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6792" name="__module.model.layers.28.self_attn/aten::transpose/ScatterElementsUpdate_2" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6793" name="__module.model.layers.28.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="4963"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6794" name="__module.model.layers.28.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.28.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6795" name="__module.model.layers.28.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="5025,5026,5027"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6796" name="__module.model.layers.28.self_attn/aten::size/ShapeOf_10" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6797" name="Constant_302253" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6798" name="__module.model.layers.28.self_attn/aten::size/Constant_11" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="6799" name="__module.model.layers.28.self_attn/aten::size/Gather_11" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="5019"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6800" name="Constant_268860" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6801" name="Constant_277181" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6802" name="Constant_277182" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6803" name="Gather_277183" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6804" name="__module.model.layers.28.self_attn/prim::ListConstruct/Concat_5" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="5028"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="6805" name="__module.model.layers.28.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5029,hidden_states.855"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6806" name="Constant_301869" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6807" name="__module.model.layers.28.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5033"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6808" name="__module.model.layers.28.self_attn/aten::slice/Reshape_60" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6809" name="ShapeOf_299988" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6810" name="Constant_299989" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6811" name="Constant_299990" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6812" name="Gather_299991" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6813" name="ShapeOf_299992" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6814" name="Constant_299993" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6815" name="Constant_299994" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6816" name="Gather_299995" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6817" name="Add_299996" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="5034"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6818" name="__module.model.layers.28.self_attn/aten::slice/Reshape_62" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6819" name="__module.model.layers.28.self_attn/aten::slice/Reshape_63" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6820" name="__module.model.layers.28.self_attn/aten::slice/Slice_15" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="5038"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="6821" name="__module.model.layers.28.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="5039,attn_output.113"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6822" name="__module.model.layers.28.self_attn/aten::transpose/ScatterElementsUpdate_3" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6823" name="__module.model.layers.28.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5040"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6824" name="Constant_301870" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="798146608" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="6825" name="__module.model.layers.28.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5043"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6826" name="self.model.layers.28.self_attn.o_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="4803739768" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6827" name="Convert_386597" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6828" name="self.model.layers.28.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="4816846968" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6829" name="Convert_386599" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6830" name="self.model.layers.28.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6831" name="self.model.layers.28.self_attn.o_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="4816949368" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6832" name="self.model.layers.28.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6833" name="Constant_386604" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6834" name="Reshape_386605" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6835" name="__module.model.layers.28.self_attn.o_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6836" name="__module.model.layers.28.self_attn.o_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5045,5047,hidden_states.857"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6837" name="__module.model.layers.28/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5050,5052,5063,hidden_states.859,hidden_states.861"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6838" name="Constant_290337" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="4817358968" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6839" name="Constant_290336" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6840" name="Constant_290334" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6841" name="__module.model.layers.28.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5053"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6842" name="Constant_19940" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="5054"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6843" name="__module.model.layers.28.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5055,variance.115"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6844" name="Constant_290335" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6845" name="__module.model.layers.28.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5056"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6846" name="__module.model.layers.28.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6847" name="__module.model.layers.28.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5057"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6848" name="__module.model.layers.28.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5058,5059,hidden_states.863,hidden_states.865"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6849" name="__module.model.layers.28.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5060,5062"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6850" name="self.model.layers.28.mlp.gate_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="4817379448" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6851" name="Convert_385437" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6852" name="self.model.layers.28.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="4852768888" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6853" name="Convert_385439" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6854" name="self.model.layers.28.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6855" name="self.model.layers.28.mlp.gate_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="4853045368" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6856" name="self.model.layers.28.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6857" name="Constant_385444" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6858" name="Reshape_385445" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6859" name="__module.model.layers.28.mlp.gate_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6860" name="__module.model.layers.28.mlp.gate_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5068,input.57"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="6861" name="__module.model.layers.28.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="5069"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="6862" name="self.model.layers.28.mlp.up_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="4854151288" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6863" name="Convert_385427" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6864" name="self.model.layers.28.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="4889540728" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6865" name="Convert_385429" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6866" name="self.model.layers.28.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6867" name="self.model.layers.28.mlp.up_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="4889817208" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6868" name="self.model.layers.28.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6869" name="Constant_385434" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6870" name="Reshape_385435" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6871" name="__module.model.layers.28.mlp.up_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6872" name="__module.model.layers.28.mlp.up_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5071"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="6873" name="__module.model.layers.28.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5072"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="6874" name="self.model.layers.28.mlp.down_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 128" offset="4890923128" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6875" name="Convert_385447" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6876" name="self.model.layers.28.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 1" offset="4926312568" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6877" name="Convert_385449" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6878" name="self.model.layers.28.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6879" name="self.model.layers.28.mlp.down_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 108, 1" offset="4926589048" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6880" name="self.model.layers.28.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6881" name="Constant_385454" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="922101848" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6882" name="Reshape_385455" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="6883" name="__module.model.layers.28.mlp.down_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="6884" name="__module.model.layers.28.mlp.down_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5074,hidden_states.867"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6885" name="__module.model.layers.28/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5075,5077,5085,5096,hidden_states.869,hidden_states.871"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6886" name="Constant_290341" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="4927694968" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6887" name="Constant_290340" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6888" name="Constant_290338" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6889" name="__module.model.layers.29.input_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5086"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6890" name="Constant_20014" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="5087"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6891" name="__module.model.layers.29.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5088,variance.117"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6892" name="Constant_290339" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6893" name="__module.model.layers.29.input_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5089"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6894" name="__module.model.layers.29.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6895" name="__module.model.layers.29.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5090"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6896" name="__module.model.layers.29.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5091,5092,hidden_states.873,hidden_states.875"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6897" name="__module.model.layers.29.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5093,5095,hidden_states.877"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6898" name="self.model.layers.29.self_attn.q_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="4927715448" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6899" name="Convert_386607" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6900" name="self.model.layers.29.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="4940822648" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6901" name="Convert_386609" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6902" name="self.model.layers.29.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6903" name="self.model.layers.29.self_attn.q_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="4940925048" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6904" name="self.model.layers.29.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6905" name="Constant_386614" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6906" name="Reshape_386615" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6907" name="__module.model.layers.29.self_attn.q_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6908" name="__module.model.layers.29.self_attn.q_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6909" name="self.model.layers.29.self_attn.q_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="5120" offset="4941334648" size="10240" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.29.self_attn.q_proj.bias"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6910" name="__module.model.layers.29.self_attn.q_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6911" name="__module.model.layers.29.self_attn.q_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5105,query_states.59"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6912" name="Constant_301871" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="792694336" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6913" name="__module.model.layers.29.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5113"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6914" name="__module.model.layers.29.self_attn/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6915" name="__module.model.layers.29.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5114,q.59"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6916" name="__module.model.layers.29.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5123"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6917" name="__module.model.layers.29.self_attn/aten::size/ShapeOf_3" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6918" name="__module.model.layers.29.self_attn/aten::size/Constant_3" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="6919" name="__module.model.layers.29.self_attn/aten::size/Gather_3" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="5124,5129" /> + </output> + </layer> + <layer id="6920" name="__module.model.layers.29.self_attn/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="6921" name="__module.model.layers.29.self_attn/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="5126,5127,5131,5132" /> + </output> + </layer> + <layer id="6922" name="Constant_220980" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6923" name="__module.model.layers.29.self_attn/aten::slice/Reshape_5" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6924" name="__module.model.layers.29.self_attn/aten::slice/Reshape_1" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6925" name="__module.model.layers.29.self_attn/aten::slice/Reshape_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6926" name="__module.model.layers.29.self_attn/aten::slice/Reshape_3" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6927" name="__module.model.layers.29.self_attn/aten::slice/Slice" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="5133,x2.117"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6928" name="Constant_290342" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6929" name="__module.model.layers.29.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5134"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6930" name="__module.model.layers.29.self_attn/aten::slice/Reshape_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6931" name="__module.model.layers.29.self_attn/aten::slice/Reshape_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6932" name="__module.model.layers.29.self_attn/aten::slice/Reshape_7" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6933" name="__module.model.layers.29.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="5128"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6934" name="__module.model.layers.29.self_attn/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5136"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6935" name="__module.model.layers.29.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5137"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6936" name="__module.model.layers.29.self_attn/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5138"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6937" name="Constant_341529" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="6938" name="Constant_341522" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6939" name="Constant_341524" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6940" name="Constant_341526" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6941" name="Concat_341527" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6942" name="Broadcast_341530" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6943" name="ReadValue_333164" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.29.keypresent.29.key" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.29.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6944" name="Constant_325483" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6945" name="Gather_325484" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6946" name="self.model.layers.29.self_attn.k_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="4941344888" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6947" name="Convert_387567" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6948" name="self.model.layers.29.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="4943966328" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6949" name="Convert_387569" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6950" name="self.model.layers.29.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6951" name="self.model.layers.29.self_attn.k_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="4943986808" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6952" name="self.model.layers.29.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6953" name="Constant_387574" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6954" name="Reshape_387575" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6955" name="__module.model.layers.29.self_attn.k_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="6956" name="__module.model.layers.29.self_attn.k_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="6957" name="self.model.layers.29.self_attn.k_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="4944068728" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.29.self_attn.k_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="6958" name="__module.model.layers.29.self_attn.k_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="6959" name="__module.model.layers.29.self_attn.k_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5108,key_states.121"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="6960" name="Constant_301872" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6961" name="__module.model.layers.29.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5116"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6962" name="__module.model.layers.29.self_attn/aten::transpose/ScatterElementsUpdate_1" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6963" name="__module.model.layers.29.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5117,k.59"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6964" name="__module.model.layers.29.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5139"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6965" name="__module.model.layers.29.self_attn/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6966" name="__module.model.layers.29.self_attn/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="6967" name="__module.model.layers.29.self_attn/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="5140,5145" /> + </output> + </layer> + <layer id="6968" name="__module.model.layers.29.self_attn/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="6969" name="__module.model.layers.29.self_attn/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="5142,5143,5147,5148" /> + </output> + </layer> + <layer id="6970" name="Constant_220981" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6971" name="__module.model.layers.29.self_attn/aten::slice/Reshape_13" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6972" name="__module.model.layers.29.self_attn/aten::slice/Reshape_9" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6973" name="__module.model.layers.29.self_attn/aten::slice/Reshape_10" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6974" name="__module.model.layers.29.self_attn/aten::slice/Reshape_11" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6975" name="__module.model.layers.29.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="5149,x2.119"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6976" name="Constant_290343" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6977" name="__module.model.layers.29.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5150"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6978" name="__module.model.layers.29.self_attn/aten::slice/Reshape_12" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6979" name="__module.model.layers.29.self_attn/aten::slice/Reshape_14" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6980" name="__module.model.layers.29.self_attn/aten::slice/Reshape_15" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6981" name="__module.model.layers.29.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="5144"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="6982" name="__module.model.layers.29.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5152"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6983" name="__module.model.layers.29.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5153"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6984" name="__module.model.layers.29.self_attn/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5154"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6985" name="__module.model.layers.29.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.29.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6986" name="__module.model.layers.29.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="5166,5167,5168"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6987" name="__module.model.layers.29.self_attn/aten::size/ShapeOf_6" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6988" name="Constant_302509" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="938477672" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6989" name="Constant_302510" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6990" name="Gather_302511" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6991" name="Constant_268878" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="6992" name="Constant_277206" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6993" name="Constant_277207" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="6994" name="Gather_277208" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="6995" name="__module.model.layers.29.self_attn/prim::ListConstruct/Concat_2" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="3" precision="I64" names="5169"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="6996" name="__module.model.layers.29.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5170,hidden_states.881"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6997" name="Constant_301873" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="6998" name="__module.model.layers.29.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5174,key_states.123"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="6999" name="Constant_341542" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="7000" name="Constant_341535" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7001" name="Constant_341537" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7002" name="Constant_341539" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7003" name="Concat_341540" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7004" name="Broadcast_341543" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7005" name="ReadValue_333166" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.29.valuepresent.29.value" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.29.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7006" name="Constant_325486" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="7007" name="Gather_325487" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7008" name="self.model.layers.29.self_attn.v_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="4944070776" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7009" name="Convert_387577" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7010" name="self.model.layers.29.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="4946692216" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7011" name="Convert_387579" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7012" name="self.model.layers.29.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7013" name="self.model.layers.29.self_attn.v_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="4946712696" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7014" name="self.model.layers.29.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7015" name="Constant_387584" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7016" name="Reshape_387585" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7017" name="__module.model.layers.29.self_attn.v_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7018" name="__module.model.layers.29.self_attn.v_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="7019" name="self.model.layers.29.self_attn.v_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="4946794616" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.29.self_attn.v_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="7020" name="__module.model.layers.29.self_attn.v_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="7021" name="__module.model.layers.29.self_attn.v_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5111,value_states.59"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="7022" name="Constant_301874" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7023" name="__module.model.layers.29.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5119"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7024" name="__module.model.layers.29.self_attn/aten::transpose/ScatterElementsUpdate_2" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7025" name="__module.model.layers.29.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5120"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7026" name="__module.model.layers.29.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.29.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7027" name="__module.model.layers.29.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="5182,5183,5184"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7028" name="__module.model.layers.29.self_attn/aten::size/ShapeOf_10" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7029" name="Constant_302259" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7030" name="__module.model.layers.29.self_attn/aten::size/Constant_11" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="7031" name="__module.model.layers.29.self_attn/aten::size/Gather_11" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="5176"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7032" name="Constant_268896" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7033" name="Constant_277216" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7034" name="Constant_277217" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="7035" name="Gather_277218" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7036" name="__module.model.layers.29.self_attn/prim::ListConstruct/Concat_5" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="5185"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="7037" name="__module.model.layers.29.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5186,hidden_states.885"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7038" name="Constant_301875" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7039" name="__module.model.layers.29.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5190"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7040" name="__module.model.layers.29.self_attn/aten::slice/Reshape_60" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7041" name="ShapeOf_300074" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7042" name="Constant_300075" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7043" name="Constant_300076" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="7044" name="Gather_300077" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7045" name="ShapeOf_300078" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7046" name="Constant_300079" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7047" name="Constant_300080" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="7048" name="Gather_300081" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7049" name="Add_300082" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="5191"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7050" name="__module.model.layers.29.self_attn/aten::slice/Reshape_62" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7051" name="__module.model.layers.29.self_attn/aten::slice/Reshape_63" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7052" name="__module.model.layers.29.self_attn/aten::slice/Slice_15" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="5195"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="7053" name="__module.model.layers.29.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="5196,attn_output.117"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7054" name="__module.model.layers.29.self_attn/aten::transpose/ScatterElementsUpdate_3" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7055" name="__module.model.layers.29.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5197"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7056" name="Constant_301876" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="798146608" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="7057" name="__module.model.layers.29.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5200"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7058" name="self.model.layers.29.self_attn.o_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="4946796664" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7059" name="Convert_386617" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7060" name="self.model.layers.29.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="4959903864" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7061" name="Convert_386619" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7062" name="self.model.layers.29.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7063" name="self.model.layers.29.self_attn.o_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="4960006264" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7064" name="self.model.layers.29.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7065" name="Constant_386624" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7066" name="Reshape_386625" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7067" name="__module.model.layers.29.self_attn.o_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7068" name="__module.model.layers.29.self_attn.o_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5202,5204,hidden_states.887"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7069" name="__module.model.layers.29/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5207,5209,5220,hidden_states.889,hidden_states.891"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7070" name="Constant_290347" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="4960415864" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7071" name="Constant_290346" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7072" name="Constant_290344" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7073" name="__module.model.layers.29.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5210"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7074" name="Constant_20612" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="5211"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7075" name="__module.model.layers.29.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5212,variance.119"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7076" name="Constant_290345" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7077" name="__module.model.layers.29.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5213"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7078" name="__module.model.layers.29.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7079" name="__module.model.layers.29.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5214"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7080" name="__module.model.layers.29.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5215,5216,hidden_states.893,hidden_states.895"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7081" name="__module.model.layers.29.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5217,5219"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7082" name="self.model.layers.29.mlp.gate_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="4960436344" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7083" name="Convert_385467" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7084" name="self.model.layers.29.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="4995825784" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7085" name="Convert_385469" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7086" name="self.model.layers.29.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7087" name="self.model.layers.29.mlp.gate_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="4996102264" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7088" name="self.model.layers.29.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7089" name="Constant_385474" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7090" name="Reshape_385475" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7091" name="__module.model.layers.29.mlp.gate_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7092" name="__module.model.layers.29.mlp.gate_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5225,input.59"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="7093" name="__module.model.layers.29.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="5226"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="7094" name="self.model.layers.29.mlp.up_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="4997208184" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7095" name="Convert_385457" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7096" name="self.model.layers.29.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="5032597624" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7097" name="Convert_385459" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7098" name="self.model.layers.29.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7099" name="self.model.layers.29.mlp.up_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="5032874104" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7100" name="self.model.layers.29.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7101" name="Constant_385464" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7102" name="Reshape_385465" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7103" name="__module.model.layers.29.mlp.up_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7104" name="__module.model.layers.29.mlp.up_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5228"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="7105" name="__module.model.layers.29.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5229"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="7106" name="self.model.layers.29.mlp.down_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 128" offset="5033980024" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7107" name="Convert_385477" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7108" name="self.model.layers.29.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 1" offset="5069369464" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7109" name="Convert_385479" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7110" name="self.model.layers.29.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7111" name="self.model.layers.29.mlp.down_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 108, 1" offset="5069645944" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7112" name="self.model.layers.29.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7113" name="Constant_385484" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="922101848" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7114" name="Reshape_385485" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="7115" name="__module.model.layers.29.mlp.down_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="7116" name="__module.model.layers.29.mlp.down_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5231,hidden_states.897"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7117" name="__module.model.layers.29/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5232,5234,5242,5253,hidden_states.899,hidden_states.901"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7118" name="Constant_290351" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="5070751864" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7119" name="Constant_290350" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7120" name="Constant_290348" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7121" name="__module.model.layers.30.input_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5243"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7122" name="Constant_20686" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="5244"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7123" name="__module.model.layers.30.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5245,variance.121"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7124" name="Constant_290349" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7125" name="__module.model.layers.30.input_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5246"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7126" name="__module.model.layers.30.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7127" name="__module.model.layers.30.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5247"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7128" name="__module.model.layers.30.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5248,5249,hidden_states.903,hidden_states.905"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7129" name="__module.model.layers.30.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5250,5252,hidden_states.907"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7130" name="self.model.layers.30.self_attn.q_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="5070772344" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7131" name="Convert_386627" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7132" name="self.model.layers.30.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="5083879544" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7133" name="Convert_386629" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7134" name="self.model.layers.30.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7135" name="self.model.layers.30.self_attn.q_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="5083981944" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7136" name="self.model.layers.30.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7137" name="Constant_386634" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7138" name="Reshape_386635" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7139" name="__module.model.layers.30.self_attn.q_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7140" name="__module.model.layers.30.self_attn.q_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7141" name="self.model.layers.30.self_attn.q_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="5120" offset="5084391544" size="10240" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.30.self_attn.q_proj.bias"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7142" name="__module.model.layers.30.self_attn.q_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7143" name="__module.model.layers.30.self_attn.q_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5262,query_states.61"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7144" name="Constant_301877" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="792694336" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7145" name="__module.model.layers.30.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5270"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7146" name="__module.model.layers.30.self_attn/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7147" name="__module.model.layers.30.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5271,q.61"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7148" name="__module.model.layers.30.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5280"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7149" name="__module.model.layers.30.self_attn/aten::size/ShapeOf_3" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7150" name="__module.model.layers.30.self_attn/aten::size/Constant_3" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="7151" name="__module.model.layers.30.self_attn/aten::size/Gather_3" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="5281,5286" /> + </output> + </layer> + <layer id="7152" name="__module.model.layers.30.self_attn/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="7153" name="__module.model.layers.30.self_attn/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="5283,5284,5288,5289" /> + </output> + </layer> + <layer id="7154" name="Constant_220995" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7155" name="__module.model.layers.30.self_attn/aten::slice/Reshape_5" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7156" name="__module.model.layers.30.self_attn/aten::slice/Reshape_1" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7157" name="__module.model.layers.30.self_attn/aten::slice/Reshape_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7158" name="__module.model.layers.30.self_attn/aten::slice/Reshape_3" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7159" name="__module.model.layers.30.self_attn/aten::slice/Slice" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="5290,x2.121"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="7160" name="Constant_290352" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7161" name="__module.model.layers.30.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5291"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="7162" name="__module.model.layers.30.self_attn/aten::slice/Reshape_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7163" name="__module.model.layers.30.self_attn/aten::slice/Reshape_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7164" name="__module.model.layers.30.self_attn/aten::slice/Reshape_7" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7165" name="__module.model.layers.30.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="5285"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="7166" name="__module.model.layers.30.self_attn/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5293"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7167" name="__module.model.layers.30.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5294"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7168" name="__module.model.layers.30.self_attn/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5295"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7169" name="Constant_341555" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="7170" name="Constant_341548" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7171" name="Constant_341550" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7172" name="Constant_341552" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7173" name="Concat_341553" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7174" name="Broadcast_341556" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7175" name="ReadValue_333172" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.30.keypresent.30.key" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.30.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7176" name="Constant_325489" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="7177" name="Gather_325490" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7178" name="self.model.layers.30.self_attn.k_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="5084401784" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7179" name="Convert_387587" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7180" name="self.model.layers.30.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="5087023224" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7181" name="Convert_387589" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7182" name="self.model.layers.30.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7183" name="self.model.layers.30.self_attn.k_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="5087043704" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7184" name="self.model.layers.30.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7185" name="Constant_387594" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7186" name="Reshape_387595" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7187" name="__module.model.layers.30.self_attn.k_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7188" name="__module.model.layers.30.self_attn.k_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="7189" name="self.model.layers.30.self_attn.k_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="5087125624" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.30.self_attn.k_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="7190" name="__module.model.layers.30.self_attn.k_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="7191" name="__module.model.layers.30.self_attn.k_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5265,key_states.125"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="7192" name="Constant_301878" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7193" name="__module.model.layers.30.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5273"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7194" name="__module.model.layers.30.self_attn/aten::transpose/ScatterElementsUpdate_1" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7195" name="__module.model.layers.30.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5274,k.61"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7196" name="__module.model.layers.30.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5296"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7197" name="__module.model.layers.30.self_attn/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7198" name="__module.model.layers.30.self_attn/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="7199" name="__module.model.layers.30.self_attn/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="5297,5302" /> + </output> + </layer> + <layer id="7200" name="__module.model.layers.30.self_attn/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="7201" name="__module.model.layers.30.self_attn/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="5299,5300,5304,5305" /> + </output> + </layer> + <layer id="7202" name="Constant_220996" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7203" name="__module.model.layers.30.self_attn/aten::slice/Reshape_13" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7204" name="__module.model.layers.30.self_attn/aten::slice/Reshape_9" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7205" name="__module.model.layers.30.self_attn/aten::slice/Reshape_10" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7206" name="__module.model.layers.30.self_attn/aten::slice/Reshape_11" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7207" name="__module.model.layers.30.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="5306,x2.123"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="7208" name="Constant_290353" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7209" name="__module.model.layers.30.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5307"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="7210" name="__module.model.layers.30.self_attn/aten::slice/Reshape_12" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7211" name="__module.model.layers.30.self_attn/aten::slice/Reshape_14" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7212" name="__module.model.layers.30.self_attn/aten::slice/Reshape_15" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7213" name="__module.model.layers.30.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="5301"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="7214" name="__module.model.layers.30.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5309"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7215" name="__module.model.layers.30.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5310"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7216" name="__module.model.layers.30.self_attn/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5311"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7217" name="__module.model.layers.30.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.30.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7218" name="__module.model.layers.30.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="5323,5324,5325"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7219" name="__module.model.layers.30.self_attn/aten::size/ShapeOf_6" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7220" name="Constant_302514" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="938477672" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7221" name="Constant_302515" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="7222" name="Gather_302516" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7223" name="Constant_268914" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7224" name="Constant_277241" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7225" name="Constant_277242" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="7226" name="Gather_277243" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7227" name="__module.model.layers.30.self_attn/prim::ListConstruct/Concat_2" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="3" precision="I64" names="5326"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="7228" name="__module.model.layers.30.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5327,hidden_states.911"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7229" name="Constant_301879" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7230" name="__module.model.layers.30.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5331,key_states.127"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7231" name="Constant_341568" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="7232" name="Constant_341561" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7233" name="Constant_341563" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7234" name="Constant_341565" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7235" name="Concat_341566" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7236" name="Broadcast_341569" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7237" name="ReadValue_333174" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.30.valuepresent.30.value" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.30.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7238" name="Constant_325492" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="7239" name="Gather_325493" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7240" name="self.model.layers.30.self_attn.v_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="5087127672" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7241" name="Convert_387597" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7242" name="self.model.layers.30.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="5089749112" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7243" name="Convert_387599" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7244" name="self.model.layers.30.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7245" name="self.model.layers.30.self_attn.v_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="5089769592" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7246" name="self.model.layers.30.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7247" name="Constant_387604" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7248" name="Reshape_387605" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7249" name="__module.model.layers.30.self_attn.v_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7250" name="__module.model.layers.30.self_attn.v_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="7251" name="self.model.layers.30.self_attn.v_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="5089851512" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.30.self_attn.v_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="7252" name="__module.model.layers.30.self_attn.v_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="7253" name="__module.model.layers.30.self_attn.v_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5268,value_states.61"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="7254" name="Constant_301880" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7255" name="__module.model.layers.30.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5276"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7256" name="__module.model.layers.30.self_attn/aten::transpose/ScatterElementsUpdate_2" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7257" name="__module.model.layers.30.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5277"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7258" name="__module.model.layers.30.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.30.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7259" name="__module.model.layers.30.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="5339,5340,5341"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7260" name="__module.model.layers.30.self_attn/aten::size/ShapeOf_10" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7261" name="Constant_302265" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7262" name="__module.model.layers.30.self_attn/aten::size/Constant_11" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="7263" name="__module.model.layers.30.self_attn/aten::size/Gather_11" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="5333"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7264" name="Constant_268932" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7265" name="Constant_277251" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7266" name="Constant_277252" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="7267" name="Gather_277253" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7268" name="__module.model.layers.30.self_attn/prim::ListConstruct/Concat_5" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="5342"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="7269" name="__module.model.layers.30.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5343,hidden_states.915"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7270" name="Constant_301881" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7271" name="__module.model.layers.30.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5347"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7272" name="__module.model.layers.30.self_attn/aten::slice/Reshape_60" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7273" name="ShapeOf_300160" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7274" name="Constant_300161" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7275" name="Constant_300162" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="7276" name="Gather_300163" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7277" name="ShapeOf_300164" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7278" name="Constant_300165" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7279" name="Constant_300166" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="7280" name="Gather_300167" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7281" name="Add_300168" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="5348"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7282" name="__module.model.layers.30.self_attn/aten::slice/Reshape_62" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7283" name="__module.model.layers.30.self_attn/aten::slice/Reshape_63" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7284" name="__module.model.layers.30.self_attn/aten::slice/Slice_15" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="5352"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="7285" name="__module.model.layers.30.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="5353,attn_output.121"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7286" name="__module.model.layers.30.self_attn/aten::transpose/ScatterElementsUpdate_3" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7287" name="__module.model.layers.30.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5354"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7288" name="Constant_301882" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="798146608" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="7289" name="__module.model.layers.30.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5357"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7290" name="self.model.layers.30.self_attn.o_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="5089853560" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7291" name="Convert_386637" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7292" name="self.model.layers.30.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="5102960760" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7293" name="Convert_386639" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7294" name="self.model.layers.30.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7295" name="self.model.layers.30.self_attn.o_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="5103063160" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7296" name="self.model.layers.30.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7297" name="Constant_386644" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7298" name="Reshape_386645" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7299" name="__module.model.layers.30.self_attn.o_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7300" name="__module.model.layers.30.self_attn.o_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5359,5361,hidden_states.917"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7301" name="__module.model.layers.30/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5364,5366,5377,hidden_states.919,hidden_states.921"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7302" name="Constant_290357" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="5103472760" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7303" name="Constant_290356" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7304" name="Constant_290354" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7305" name="__module.model.layers.30.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5367"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7306" name="Constant_21284" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="5368"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7307" name="__module.model.layers.30.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5369,variance.123"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7308" name="Constant_290355" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7309" name="__module.model.layers.30.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5370"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7310" name="__module.model.layers.30.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7311" name="__module.model.layers.30.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5371"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7312" name="__module.model.layers.30.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5372,5373,hidden_states.923,hidden_states.925"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7313" name="__module.model.layers.30.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5374,5376"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7314" name="self.model.layers.30.mlp.gate_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="5103493240" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7315" name="Convert_385497" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7316" name="self.model.layers.30.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="5138882680" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7317" name="Convert_385499" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7318" name="self.model.layers.30.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7319" name="self.model.layers.30.mlp.gate_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="5139159160" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7320" name="self.model.layers.30.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7321" name="Constant_385504" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7322" name="Reshape_385505" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7323" name="__module.model.layers.30.mlp.gate_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7324" name="__module.model.layers.30.mlp.gate_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5382,input.61"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="7325" name="__module.model.layers.30.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="5383"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="7326" name="self.model.layers.30.mlp.up_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="5140265080" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7327" name="Convert_385487" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7328" name="self.model.layers.30.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="5175654520" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7329" name="Convert_385489" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7330" name="self.model.layers.30.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7331" name="self.model.layers.30.mlp.up_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="5175931000" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7332" name="self.model.layers.30.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7333" name="Constant_385494" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7334" name="Reshape_385495" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7335" name="__module.model.layers.30.mlp.up_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7336" name="__module.model.layers.30.mlp.up_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5385"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="7337" name="__module.model.layers.30.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5386"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="7338" name="self.model.layers.30.mlp.down_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 128" offset="5177036920" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7339" name="Convert_385507" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7340" name="self.model.layers.30.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 1" offset="5212426360" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7341" name="Convert_385509" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7342" name="self.model.layers.30.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7343" name="self.model.layers.30.mlp.down_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 108, 1" offset="5212702840" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7344" name="self.model.layers.30.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7345" name="Constant_385514" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="922101848" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7346" name="Reshape_385515" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="7347" name="__module.model.layers.30.mlp.down_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="7348" name="__module.model.layers.30.mlp.down_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5388,hidden_states.927"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7349" name="__module.model.layers.30/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5389,5391,5399,5410,hidden_states.929,hidden_states.931"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7350" name="Constant_290361" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="5213808760" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7351" name="Constant_290360" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7352" name="Constant_290358" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7353" name="__module.model.layers.31.input_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5400"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7354" name="Constant_21358" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="5401"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7355" name="__module.model.layers.31.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5402,variance.125"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7356" name="Constant_290359" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7357" name="__module.model.layers.31.input_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5403"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7358" name="__module.model.layers.31.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7359" name="__module.model.layers.31.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5404"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7360" name="__module.model.layers.31.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5405,5406,hidden_states.933,hidden_states.935"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7361" name="__module.model.layers.31.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5407,5409,hidden_states.937"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7362" name="self.model.layers.31.self_attn.q_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="5213829240" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7363" name="Convert_386647" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7364" name="self.model.layers.31.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="5226936440" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7365" name="Convert_386649" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7366" name="self.model.layers.31.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7367" name="self.model.layers.31.self_attn.q_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="5227038840" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7368" name="self.model.layers.31.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7369" name="Constant_386654" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7370" name="Reshape_386655" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7371" name="__module.model.layers.31.self_attn.q_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7372" name="__module.model.layers.31.self_attn.q_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7373" name="self.model.layers.31.self_attn.q_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="5120" offset="5227448440" size="10240" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.31.self_attn.q_proj.bias"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7374" name="__module.model.layers.31.self_attn.q_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7375" name="__module.model.layers.31.self_attn.q_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5419,query_states.63"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7376" name="Constant_301883" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="792694336" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7377" name="__module.model.layers.31.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5427"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7378" name="__module.model.layers.31.self_attn/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7379" name="__module.model.layers.31.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5428,q.63"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7380" name="__module.model.layers.31.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5437"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7381" name="__module.model.layers.31.self_attn/aten::size/ShapeOf_3" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7382" name="__module.model.layers.31.self_attn/aten::size/Constant_3" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="7383" name="__module.model.layers.31.self_attn/aten::size/Gather_3" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="5438,5443" /> + </output> + </layer> + <layer id="7384" name="__module.model.layers.31.self_attn/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="7385" name="__module.model.layers.31.self_attn/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="5440,5441,5445,5446" /> + </output> + </layer> + <layer id="7386" name="Constant_221010" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7387" name="__module.model.layers.31.self_attn/aten::slice/Reshape_5" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7388" name="__module.model.layers.31.self_attn/aten::slice/Reshape_1" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7389" name="__module.model.layers.31.self_attn/aten::slice/Reshape_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7390" name="__module.model.layers.31.self_attn/aten::slice/Reshape_3" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7391" name="__module.model.layers.31.self_attn/aten::slice/Slice" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="5447,x2.125"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="7392" name="Constant_290362" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7393" name="__module.model.layers.31.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5448"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="7394" name="__module.model.layers.31.self_attn/aten::slice/Reshape_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7395" name="__module.model.layers.31.self_attn/aten::slice/Reshape_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7396" name="__module.model.layers.31.self_attn/aten::slice/Reshape_7" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7397" name="__module.model.layers.31.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="5442"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="7398" name="__module.model.layers.31.self_attn/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5450"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7399" name="__module.model.layers.31.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5451"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7400" name="__module.model.layers.31.self_attn/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5452"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7401" name="Constant_341581" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="7402" name="Constant_341574" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7403" name="Constant_341576" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7404" name="Constant_341578" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7405" name="Concat_341579" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7406" name="Broadcast_341582" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7407" name="ReadValue_333176" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.31.keypresent.31.key" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.31.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7408" name="Constant_325495" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="7409" name="Gather_325496" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7410" name="self.model.layers.31.self_attn.k_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="5227458680" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7411" name="Convert_387607" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7412" name="self.model.layers.31.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="5230080120" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7413" name="Convert_387609" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7414" name="self.model.layers.31.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7415" name="self.model.layers.31.self_attn.k_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="5230100600" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7416" name="self.model.layers.31.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7417" name="Constant_387614" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7418" name="Reshape_387615" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7419" name="__module.model.layers.31.self_attn.k_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7420" name="__module.model.layers.31.self_attn.k_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="7421" name="self.model.layers.31.self_attn.k_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="5230182520" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.31.self_attn.k_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="7422" name="__module.model.layers.31.self_attn.k_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="7423" name="__module.model.layers.31.self_attn.k_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5422,key_states.129"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="7424" name="Constant_301884" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7425" name="__module.model.layers.31.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5430"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7426" name="__module.model.layers.31.self_attn/aten::transpose/ScatterElementsUpdate_1" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7427" name="__module.model.layers.31.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5431,k.63"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7428" name="__module.model.layers.31.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5453"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7429" name="__module.model.layers.31.self_attn/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7430" name="__module.model.layers.31.self_attn/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="7431" name="__module.model.layers.31.self_attn/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="5454,5459" /> + </output> + </layer> + <layer id="7432" name="__module.model.layers.31.self_attn/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="7433" name="__module.model.layers.31.self_attn/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="5456,5457,5461,5462" /> + </output> + </layer> + <layer id="7434" name="Constant_221011" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7435" name="__module.model.layers.31.self_attn/aten::slice/Reshape_13" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7436" name="__module.model.layers.31.self_attn/aten::slice/Reshape_9" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7437" name="__module.model.layers.31.self_attn/aten::slice/Reshape_10" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7438" name="__module.model.layers.31.self_attn/aten::slice/Reshape_11" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7439" name="__module.model.layers.31.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="5463,x2.127"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="7440" name="Constant_290363" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7441" name="__module.model.layers.31.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5464"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="7442" name="__module.model.layers.31.self_attn/aten::slice/Reshape_12" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7443" name="__module.model.layers.31.self_attn/aten::slice/Reshape_14" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7444" name="__module.model.layers.31.self_attn/aten::slice/Reshape_15" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7445" name="__module.model.layers.31.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="5458"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="7446" name="__module.model.layers.31.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5466"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7447" name="__module.model.layers.31.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5467"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7448" name="__module.model.layers.31.self_attn/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5468"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7449" name="__module.model.layers.31.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.31.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7450" name="__module.model.layers.31.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="5480,5481,5482"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7451" name="__module.model.layers.31.self_attn/aten::size/ShapeOf_6" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7452" name="Constant_302519" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="938477672" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7453" name="Constant_302520" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="7454" name="Gather_302521" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7455" name="Constant_268950" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7456" name="Constant_277276" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7457" name="Constant_277277" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="7458" name="Gather_277278" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7459" name="__module.model.layers.31.self_attn/prim::ListConstruct/Concat_2" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="3" precision="I64" names="5483"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="7460" name="__module.model.layers.31.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5484,hidden_states.941"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7461" name="Constant_301885" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7462" name="__module.model.layers.31.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5488,key_states.131"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7463" name="Constant_341594" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="7464" name="Constant_341587" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7465" name="Constant_341589" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7466" name="Constant_341591" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7467" name="Concat_341592" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7468" name="Broadcast_341595" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7469" name="ReadValue_333178" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.31.valuepresent.31.value" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.31.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7470" name="Constant_325498" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="7471" name="Gather_325499" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7472" name="self.model.layers.31.self_attn.v_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="5230184568" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7473" name="Convert_387617" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7474" name="self.model.layers.31.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="5232806008" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7475" name="Convert_387619" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7476" name="self.model.layers.31.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7477" name="self.model.layers.31.self_attn.v_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="5232826488" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7478" name="self.model.layers.31.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7479" name="Constant_387624" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7480" name="Reshape_387625" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7481" name="__module.model.layers.31.self_attn.v_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7482" name="__module.model.layers.31.self_attn.v_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="7483" name="self.model.layers.31.self_attn.v_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="5232908408" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.31.self_attn.v_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="7484" name="__module.model.layers.31.self_attn.v_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="7485" name="__module.model.layers.31.self_attn.v_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5425,value_states.63"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="7486" name="Constant_301886" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7487" name="__module.model.layers.31.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5433"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7488" name="__module.model.layers.31.self_attn/aten::transpose/ScatterElementsUpdate_2" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7489" name="__module.model.layers.31.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5434"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7490" name="__module.model.layers.31.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.31.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7491" name="__module.model.layers.31.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="5496,5497,5498"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7492" name="__module.model.layers.31.self_attn/aten::size/ShapeOf_10" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7493" name="Constant_302271" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7494" name="__module.model.layers.31.self_attn/aten::size/Constant_11" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="7495" name="__module.model.layers.31.self_attn/aten::size/Gather_11" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="5490"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7496" name="Constant_268968" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7497" name="Constant_277286" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7498" name="Constant_277287" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="7499" name="Gather_277288" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7500" name="__module.model.layers.31.self_attn/prim::ListConstruct/Concat_5" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="5499"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="7501" name="__module.model.layers.31.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5500,hidden_states.945"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7502" name="Constant_301887" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7503" name="__module.model.layers.31.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5504"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7504" name="__module.model.layers.31.self_attn/aten::slice/Reshape_60" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7505" name="ShapeOf_300246" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7506" name="Constant_300247" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7507" name="Constant_300248" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="7508" name="Gather_300249" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7509" name="ShapeOf_300250" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7510" name="Constant_300251" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7511" name="Constant_300252" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="7512" name="Gather_300253" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7513" name="Add_300254" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="5505"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7514" name="__module.model.layers.31.self_attn/aten::slice/Reshape_62" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7515" name="__module.model.layers.31.self_attn/aten::slice/Reshape_63" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7516" name="__module.model.layers.31.self_attn/aten::slice/Slice_15" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="5509"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="7517" name="__module.model.layers.31.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="5510,attn_output.125"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7518" name="__module.model.layers.31.self_attn/aten::transpose/ScatterElementsUpdate_3" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7519" name="__module.model.layers.31.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5511"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7520" name="Constant_301888" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="798146608" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="7521" name="__module.model.layers.31.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5514"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7522" name="self.model.layers.31.self_attn.o_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="5232910456" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7523" name="Convert_386657" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7524" name="self.model.layers.31.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="5246017656" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7525" name="Convert_386659" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7526" name="self.model.layers.31.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7527" name="self.model.layers.31.self_attn.o_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="5246120056" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7528" name="self.model.layers.31.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7529" name="Constant_386664" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7530" name="Reshape_386665" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7531" name="__module.model.layers.31.self_attn.o_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7532" name="__module.model.layers.31.self_attn.o_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5516,5518,hidden_states.947"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7533" name="__module.model.layers.31/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5521,5523,5534,hidden_states.949,hidden_states.951"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7534" name="Constant_290367" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="5246529656" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7535" name="Constant_290366" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7536" name="Constant_290364" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7537" name="__module.model.layers.31.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5524"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7538" name="Constant_21956" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="5525"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7539" name="__module.model.layers.31.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5526,variance.127"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7540" name="Constant_290365" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7541" name="__module.model.layers.31.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5527"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7542" name="__module.model.layers.31.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7543" name="__module.model.layers.31.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5528"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7544" name="__module.model.layers.31.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5529,5530,hidden_states.953,hidden_states.955"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7545" name="__module.model.layers.31.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5531,5533"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7546" name="self.model.layers.31.mlp.gate_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="5246550136" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7547" name="Convert_385527" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7548" name="self.model.layers.31.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="5281939576" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7549" name="Convert_385529" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7550" name="self.model.layers.31.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7551" name="self.model.layers.31.mlp.gate_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="5282216056" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7552" name="self.model.layers.31.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7553" name="Constant_385534" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7554" name="Reshape_385535" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7555" name="__module.model.layers.31.mlp.gate_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7556" name="__module.model.layers.31.mlp.gate_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5539,input.63"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="7557" name="__module.model.layers.31.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="5540"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="7558" name="self.model.layers.31.mlp.up_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="5283321976" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7559" name="Convert_385517" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7560" name="self.model.layers.31.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="5318711416" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7561" name="Convert_385519" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7562" name="self.model.layers.31.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7563" name="self.model.layers.31.mlp.up_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="5318987896" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7564" name="self.model.layers.31.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7565" name="Constant_385524" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7566" name="Reshape_385525" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7567" name="__module.model.layers.31.mlp.up_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7568" name="__module.model.layers.31.mlp.up_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5542"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="7569" name="__module.model.layers.31.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5543"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="7570" name="self.model.layers.31.mlp.down_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 128" offset="5320093816" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7571" name="Convert_385537" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7572" name="self.model.layers.31.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 1" offset="5355483256" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7573" name="Convert_385539" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7574" name="self.model.layers.31.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7575" name="self.model.layers.31.mlp.down_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 108, 1" offset="5355759736" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7576" name="self.model.layers.31.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7577" name="Constant_385544" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="922101848" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7578" name="Reshape_385545" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="7579" name="__module.model.layers.31.mlp.down_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="7580" name="__module.model.layers.31.mlp.down_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5545,hidden_states.957"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7581" name="__module.model.layers.31/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5546,5548,5556,5567,hidden_states.959,hidden_states.961"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7582" name="Constant_290371" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="5356865656" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7583" name="Constant_290370" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7584" name="Constant_290368" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7585" name="__module.model.layers.32.input_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5557"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7586" name="Constant_22030" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="5558"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7587" name="__module.model.layers.32.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5559,variance.129"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7588" name="Constant_290369" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7589" name="__module.model.layers.32.input_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5560"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7590" name="__module.model.layers.32.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7591" name="__module.model.layers.32.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5561"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7592" name="__module.model.layers.32.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5562,5563,hidden_states.963,hidden_states.965"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7593" name="__module.model.layers.32.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5564,5566,hidden_states.967"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7594" name="self.model.layers.32.self_attn.q_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="5356886136" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7595" name="Convert_386667" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7596" name="self.model.layers.32.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="5369993336" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7597" name="Convert_386669" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7598" name="self.model.layers.32.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7599" name="self.model.layers.32.self_attn.q_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="5370095736" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7600" name="self.model.layers.32.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7601" name="Constant_386674" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7602" name="Reshape_386675" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7603" name="__module.model.layers.32.self_attn.q_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7604" name="__module.model.layers.32.self_attn.q_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7605" name="self.model.layers.32.self_attn.q_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="5120" offset="5370505336" size="10240" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.32.self_attn.q_proj.bias"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7606" name="__module.model.layers.32.self_attn.q_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7607" name="__module.model.layers.32.self_attn.q_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5576,query_states.65"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7608" name="Constant_301889" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="792694336" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7609" name="__module.model.layers.32.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5584"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7610" name="__module.model.layers.32.self_attn/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7611" name="__module.model.layers.32.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5585,q.65"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7612" name="__module.model.layers.32.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5594"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7613" name="__module.model.layers.32.self_attn/aten::size/ShapeOf_3" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7614" name="__module.model.layers.32.self_attn/aten::size/Constant_3" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="7615" name="__module.model.layers.32.self_attn/aten::size/Gather_3" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="5595,5600" /> + </output> + </layer> + <layer id="7616" name="__module.model.layers.32.self_attn/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="7617" name="__module.model.layers.32.self_attn/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="5597,5598,5602,5603" /> + </output> + </layer> + <layer id="7618" name="Constant_221025" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7619" name="__module.model.layers.32.self_attn/aten::slice/Reshape_5" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7620" name="__module.model.layers.32.self_attn/aten::slice/Reshape_1" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7621" name="__module.model.layers.32.self_attn/aten::slice/Reshape_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7622" name="__module.model.layers.32.self_attn/aten::slice/Reshape_3" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7623" name="__module.model.layers.32.self_attn/aten::slice/Slice" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="5604,x2.129"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="7624" name="Constant_290372" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7625" name="__module.model.layers.32.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5605"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="7626" name="__module.model.layers.32.self_attn/aten::slice/Reshape_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7627" name="__module.model.layers.32.self_attn/aten::slice/Reshape_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7628" name="__module.model.layers.32.self_attn/aten::slice/Reshape_7" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7629" name="__module.model.layers.32.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="5599"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="7630" name="__module.model.layers.32.self_attn/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5607"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7631" name="__module.model.layers.32.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5608"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7632" name="__module.model.layers.32.self_attn/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5609"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7633" name="Constant_341607" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="7634" name="Constant_341600" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7635" name="Constant_341602" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7636" name="Constant_341604" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7637" name="Concat_341605" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7638" name="Broadcast_341608" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7639" name="ReadValue_333180" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.32.keypresent.32.key" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.32.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7640" name="Constant_325501" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="7641" name="Gather_325502" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7642" name="self.model.layers.32.self_attn.k_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="5370515576" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7643" name="Convert_387627" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7644" name="self.model.layers.32.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="5373137016" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7645" name="Convert_387629" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7646" name="self.model.layers.32.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7647" name="self.model.layers.32.self_attn.k_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="5373157496" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7648" name="self.model.layers.32.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7649" name="Constant_387634" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7650" name="Reshape_387635" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7651" name="__module.model.layers.32.self_attn.k_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7652" name="__module.model.layers.32.self_attn.k_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="7653" name="self.model.layers.32.self_attn.k_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="5373239416" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.32.self_attn.k_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="7654" name="__module.model.layers.32.self_attn.k_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="7655" name="__module.model.layers.32.self_attn.k_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5579,key_states.133"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="7656" name="Constant_301890" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7657" name="__module.model.layers.32.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5587"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7658" name="__module.model.layers.32.self_attn/aten::transpose/ScatterElementsUpdate_1" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7659" name="__module.model.layers.32.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5588,k.65"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7660" name="__module.model.layers.32.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5610"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7661" name="__module.model.layers.32.self_attn/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7662" name="__module.model.layers.32.self_attn/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="7663" name="__module.model.layers.32.self_attn/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="5611,5616" /> + </output> + </layer> + <layer id="7664" name="__module.model.layers.32.self_attn/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="7665" name="__module.model.layers.32.self_attn/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="5613,5614,5618,5619" /> + </output> + </layer> + <layer id="7666" name="Constant_221026" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7667" name="__module.model.layers.32.self_attn/aten::slice/Reshape_13" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7668" name="__module.model.layers.32.self_attn/aten::slice/Reshape_9" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7669" name="__module.model.layers.32.self_attn/aten::slice/Reshape_10" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7670" name="__module.model.layers.32.self_attn/aten::slice/Reshape_11" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7671" name="__module.model.layers.32.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="5620,x2.131"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="7672" name="Constant_290373" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7673" name="__module.model.layers.32.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5621"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="7674" name="__module.model.layers.32.self_attn/aten::slice/Reshape_12" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7675" name="__module.model.layers.32.self_attn/aten::slice/Reshape_14" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7676" name="__module.model.layers.32.self_attn/aten::slice/Reshape_15" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7677" name="__module.model.layers.32.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="5615"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="7678" name="__module.model.layers.32.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5623"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7679" name="__module.model.layers.32.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5624"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7680" name="__module.model.layers.32.self_attn/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5625"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7681" name="__module.model.layers.32.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.32.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7682" name="__module.model.layers.32.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="5637,5638,5639"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7683" name="__module.model.layers.32.self_attn/aten::size/ShapeOf_6" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7684" name="Constant_302524" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="938477672" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7685" name="Constant_302525" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="7686" name="Gather_302526" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7687" name="Constant_268986" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7688" name="Constant_277311" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7689" name="Constant_277312" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="7690" name="Gather_277313" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7691" name="__module.model.layers.32.self_attn/prim::ListConstruct/Concat_2" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="3" precision="I64" names="5640"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="7692" name="__module.model.layers.32.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5641,hidden_states.971"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7693" name="Constant_301891" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7694" name="__module.model.layers.32.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5645,key_states.135"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7695" name="Constant_341620" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="7696" name="Constant_341613" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7697" name="Constant_341615" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7698" name="Constant_341617" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7699" name="Concat_341618" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7700" name="Broadcast_341621" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7701" name="ReadValue_333182" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.32.valuepresent.32.value" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.32.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7702" name="Constant_325504" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="7703" name="Gather_325505" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7704" name="self.model.layers.32.self_attn.v_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="5373241464" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7705" name="Convert_387637" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7706" name="self.model.layers.32.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="5375862904" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7707" name="Convert_387639" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7708" name="self.model.layers.32.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7709" name="self.model.layers.32.self_attn.v_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="5375883384" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7710" name="self.model.layers.32.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7711" name="Constant_387644" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7712" name="Reshape_387645" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7713" name="__module.model.layers.32.self_attn.v_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7714" name="__module.model.layers.32.self_attn.v_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="7715" name="self.model.layers.32.self_attn.v_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="5375965304" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.32.self_attn.v_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="7716" name="__module.model.layers.32.self_attn.v_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="7717" name="__module.model.layers.32.self_attn.v_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5582,value_states.65"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="7718" name="Constant_301892" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7719" name="__module.model.layers.32.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5590"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7720" name="__module.model.layers.32.self_attn/aten::transpose/ScatterElementsUpdate_2" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7721" name="__module.model.layers.32.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5591"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7722" name="__module.model.layers.32.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.32.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7723" name="__module.model.layers.32.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="5653,5654,5655"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7724" name="__module.model.layers.32.self_attn/aten::size/ShapeOf_10" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7725" name="Constant_302277" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7726" name="__module.model.layers.32.self_attn/aten::size/Constant_11" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="7727" name="__module.model.layers.32.self_attn/aten::size/Gather_11" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="5647"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7728" name="Constant_269004" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7729" name="Constant_277321" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7730" name="Constant_277322" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="7731" name="Gather_277323" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7732" name="__module.model.layers.32.self_attn/prim::ListConstruct/Concat_5" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="5656"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="7733" name="__module.model.layers.32.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5657,hidden_states.975"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7734" name="Constant_301893" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7735" name="__module.model.layers.32.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5661"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7736" name="__module.model.layers.32.self_attn/aten::slice/Reshape_60" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7737" name="ShapeOf_300332" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7738" name="Constant_300333" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7739" name="Constant_300334" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="7740" name="Gather_300335" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7741" name="ShapeOf_300336" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7742" name="Constant_300337" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7743" name="Constant_300338" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="7744" name="Gather_300339" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7745" name="Add_300340" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="5662"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7746" name="__module.model.layers.32.self_attn/aten::slice/Reshape_62" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7747" name="__module.model.layers.32.self_attn/aten::slice/Reshape_63" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7748" name="__module.model.layers.32.self_attn/aten::slice/Slice_15" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="5666"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="7749" name="__module.model.layers.32.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="5667,attn_output.129"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7750" name="__module.model.layers.32.self_attn/aten::transpose/ScatterElementsUpdate_3" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7751" name="__module.model.layers.32.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5668"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7752" name="Constant_301894" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="798146608" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="7753" name="__module.model.layers.32.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5671"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7754" name="self.model.layers.32.self_attn.o_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="5375967352" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7755" name="Convert_386677" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7756" name="self.model.layers.32.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="5389074552" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7757" name="Convert_386679" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7758" name="self.model.layers.32.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7759" name="self.model.layers.32.self_attn.o_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="5389176952" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7760" name="self.model.layers.32.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7761" name="Constant_386684" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7762" name="Reshape_386685" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7763" name="__module.model.layers.32.self_attn.o_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7764" name="__module.model.layers.32.self_attn.o_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5673,5675,hidden_states.977"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7765" name="__module.model.layers.32/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5678,5680,5691,hidden_states.979,hidden_states.981"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7766" name="Constant_290377" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="5389586552" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7767" name="Constant_290376" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7768" name="Constant_290374" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7769" name="__module.model.layers.32.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5681"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7770" name="Constant_22628" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="5682"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7771" name="__module.model.layers.32.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5683,variance.131"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7772" name="Constant_290375" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7773" name="__module.model.layers.32.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5684"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7774" name="__module.model.layers.32.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7775" name="__module.model.layers.32.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5685"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7776" name="__module.model.layers.32.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5686,5687,hidden_states.983,hidden_states.985"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7777" name="__module.model.layers.32.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5688,5690"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7778" name="self.model.layers.32.mlp.gate_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="5389607032" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7779" name="Convert_385557" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7780" name="self.model.layers.32.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="5424996472" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7781" name="Convert_385559" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7782" name="self.model.layers.32.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7783" name="self.model.layers.32.mlp.gate_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="5425272952" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7784" name="self.model.layers.32.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7785" name="Constant_385564" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7786" name="Reshape_385565" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7787" name="__module.model.layers.32.mlp.gate_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7788" name="__module.model.layers.32.mlp.gate_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5696,input.65"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="7789" name="__module.model.layers.32.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="5697"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="7790" name="self.model.layers.32.mlp.up_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="5426378872" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7791" name="Convert_385547" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7792" name="self.model.layers.32.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="5461768312" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7793" name="Convert_385549" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7794" name="self.model.layers.32.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7795" name="self.model.layers.32.mlp.up_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="5462044792" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7796" name="self.model.layers.32.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7797" name="Constant_385554" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7798" name="Reshape_385555" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7799" name="__module.model.layers.32.mlp.up_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7800" name="__module.model.layers.32.mlp.up_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5699"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="7801" name="__module.model.layers.32.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5700"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="7802" name="self.model.layers.32.mlp.down_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 128" offset="5463150712" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7803" name="Convert_385567" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7804" name="self.model.layers.32.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 1" offset="5498540152" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7805" name="Convert_385569" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7806" name="self.model.layers.32.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7807" name="self.model.layers.32.mlp.down_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 108, 1" offset="5498816632" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7808" name="self.model.layers.32.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7809" name="Constant_385574" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="922101848" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7810" name="Reshape_385575" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="7811" name="__module.model.layers.32.mlp.down_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="7812" name="__module.model.layers.32.mlp.down_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5702,hidden_states.987"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7813" name="__module.model.layers.32/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5703,5705,5713,5724,hidden_states.989,hidden_states.991"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7814" name="Constant_290381" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="5499922552" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7815" name="Constant_290380" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7816" name="Constant_290378" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7817" name="__module.model.layers.33.input_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5714"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7818" name="Constant_22702" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="5715"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7819" name="__module.model.layers.33.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5716,variance.133"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7820" name="Constant_290379" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7821" name="__module.model.layers.33.input_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5717"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7822" name="__module.model.layers.33.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7823" name="__module.model.layers.33.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5718"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7824" name="__module.model.layers.33.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5719,5720,hidden_states.993,hidden_states.995"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7825" name="__module.model.layers.33.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5721,5723,hidden_states.997"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7826" name="self.model.layers.33.self_attn.q_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="5499943032" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7827" name="Convert_386687" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7828" name="self.model.layers.33.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="5513050232" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7829" name="Convert_386689" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7830" name="self.model.layers.33.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7831" name="self.model.layers.33.self_attn.q_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="5513152632" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7832" name="self.model.layers.33.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7833" name="Constant_386694" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7834" name="Reshape_386695" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7835" name="__module.model.layers.33.self_attn.q_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7836" name="__module.model.layers.33.self_attn.q_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7837" name="self.model.layers.33.self_attn.q_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="5120" offset="5513562232" size="10240" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.33.self_attn.q_proj.bias"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7838" name="__module.model.layers.33.self_attn.q_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7839" name="__module.model.layers.33.self_attn.q_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5733,query_states.67"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7840" name="Constant_301895" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="792694336" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7841" name="__module.model.layers.33.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5741"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7842" name="__module.model.layers.33.self_attn/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7843" name="__module.model.layers.33.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5742,q.67"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7844" name="__module.model.layers.33.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5751"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7845" name="__module.model.layers.33.self_attn/aten::size/ShapeOf_3" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7846" name="__module.model.layers.33.self_attn/aten::size/Constant_3" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="7847" name="__module.model.layers.33.self_attn/aten::size/Gather_3" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="5752,5757" /> + </output> + </layer> + <layer id="7848" name="__module.model.layers.33.self_attn/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="7849" name="__module.model.layers.33.self_attn/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="5754,5755,5759,5760" /> + </output> + </layer> + <layer id="7850" name="Constant_221040" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7851" name="__module.model.layers.33.self_attn/aten::slice/Reshape_5" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7852" name="__module.model.layers.33.self_attn/aten::slice/Reshape_1" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7853" name="__module.model.layers.33.self_attn/aten::slice/Reshape_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7854" name="__module.model.layers.33.self_attn/aten::slice/Reshape_3" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7855" name="__module.model.layers.33.self_attn/aten::slice/Slice" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="5761,x2.133"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="7856" name="Constant_290382" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7857" name="__module.model.layers.33.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5762"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="7858" name="__module.model.layers.33.self_attn/aten::slice/Reshape_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7859" name="__module.model.layers.33.self_attn/aten::slice/Reshape_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7860" name="__module.model.layers.33.self_attn/aten::slice/Reshape_7" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7861" name="__module.model.layers.33.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="5756"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="7862" name="__module.model.layers.33.self_attn/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5764"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7863" name="__module.model.layers.33.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5765"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7864" name="__module.model.layers.33.self_attn/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5766"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7865" name="Constant_341633" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="7866" name="Constant_341626" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7867" name="Constant_341628" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7868" name="Constant_341630" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7869" name="Concat_341631" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7870" name="Broadcast_341634" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7871" name="ReadValue_333184" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.33.keypresent.33.key" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.33.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7872" name="Constant_325507" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="7873" name="Gather_325508" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7874" name="self.model.layers.33.self_attn.k_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="5513572472" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7875" name="Convert_387647" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7876" name="self.model.layers.33.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="5516193912" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7877" name="Convert_387649" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7878" name="self.model.layers.33.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7879" name="self.model.layers.33.self_attn.k_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="5516214392" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7880" name="self.model.layers.33.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7881" name="Constant_387654" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7882" name="Reshape_387655" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7883" name="__module.model.layers.33.self_attn.k_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7884" name="__module.model.layers.33.self_attn.k_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="7885" name="self.model.layers.33.self_attn.k_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="5516296312" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.33.self_attn.k_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="7886" name="__module.model.layers.33.self_attn.k_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="7887" name="__module.model.layers.33.self_attn.k_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5736,key_states.137"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="7888" name="Constant_301896" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7889" name="__module.model.layers.33.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5744"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7890" name="__module.model.layers.33.self_attn/aten::transpose/ScatterElementsUpdate_1" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7891" name="__module.model.layers.33.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5745,k.67"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7892" name="__module.model.layers.33.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5767"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7893" name="__module.model.layers.33.self_attn/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7894" name="__module.model.layers.33.self_attn/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="7895" name="__module.model.layers.33.self_attn/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="5768,5773" /> + </output> + </layer> + <layer id="7896" name="__module.model.layers.33.self_attn/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="7897" name="__module.model.layers.33.self_attn/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="5770,5771,5775,5776" /> + </output> + </layer> + <layer id="7898" name="Constant_221041" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7899" name="__module.model.layers.33.self_attn/aten::slice/Reshape_13" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7900" name="__module.model.layers.33.self_attn/aten::slice/Reshape_9" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7901" name="__module.model.layers.33.self_attn/aten::slice/Reshape_10" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7902" name="__module.model.layers.33.self_attn/aten::slice/Reshape_11" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7903" name="__module.model.layers.33.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="5777,x2.135"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="7904" name="Constant_290383" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7905" name="__module.model.layers.33.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5778"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="7906" name="__module.model.layers.33.self_attn/aten::slice/Reshape_12" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7907" name="__module.model.layers.33.self_attn/aten::slice/Reshape_14" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7908" name="__module.model.layers.33.self_attn/aten::slice/Reshape_15" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7909" name="__module.model.layers.33.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="5772"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="7910" name="__module.model.layers.33.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5780"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7911" name="__module.model.layers.33.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5781"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7912" name="__module.model.layers.33.self_attn/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5782"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7913" name="__module.model.layers.33.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.33.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7914" name="__module.model.layers.33.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="5794,5795,5796"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7915" name="__module.model.layers.33.self_attn/aten::size/ShapeOf_6" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7916" name="Constant_302529" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="938477672" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7917" name="Constant_302530" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="7918" name="Gather_302531" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7919" name="Constant_269022" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7920" name="Constant_277346" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7921" name="Constant_277347" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="7922" name="Gather_277348" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7923" name="__module.model.layers.33.self_attn/prim::ListConstruct/Concat_2" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="3" precision="I64" names="5797"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="7924" name="__module.model.layers.33.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5798,hidden_states.1001"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7925" name="Constant_301897" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7926" name="__module.model.layers.33.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5802,key_states.139"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7927" name="Constant_341646" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="7928" name="Constant_341639" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7929" name="Constant_341641" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7930" name="Constant_341643" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7931" name="Concat_341644" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7932" name="Broadcast_341647" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7933" name="ReadValue_333186" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.33.valuepresent.33.value" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.33.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7934" name="Constant_325510" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="7935" name="Gather_325511" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7936" name="self.model.layers.33.self_attn.v_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="5516298360" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7937" name="Convert_387657" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7938" name="self.model.layers.33.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="5518919800" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7939" name="Convert_387659" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7940" name="self.model.layers.33.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7941" name="self.model.layers.33.self_attn.v_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="5518940280" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7942" name="self.model.layers.33.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7943" name="Constant_387664" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7944" name="Reshape_387665" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7945" name="__module.model.layers.33.self_attn.v_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7946" name="__module.model.layers.33.self_attn.v_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="7947" name="self.model.layers.33.self_attn.v_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="5519022200" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.33.self_attn.v_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="7948" name="__module.model.layers.33.self_attn.v_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="7949" name="__module.model.layers.33.self_attn.v_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5739,value_states.67"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="7950" name="Constant_301898" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7951" name="__module.model.layers.33.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5747"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7952" name="__module.model.layers.33.self_attn/aten::transpose/ScatterElementsUpdate_2" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7953" name="__module.model.layers.33.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5748"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7954" name="__module.model.layers.33.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.33.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7955" name="__module.model.layers.33.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="5810,5811,5812"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7956" name="__module.model.layers.33.self_attn/aten::size/ShapeOf_10" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7957" name="Constant_302283" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7958" name="__module.model.layers.33.self_attn/aten::size/Constant_11" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="7959" name="__module.model.layers.33.self_attn/aten::size/Gather_11" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="5804"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7960" name="Constant_269040" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7961" name="Constant_277356" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7962" name="Constant_277357" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="7963" name="Gather_277358" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7964" name="__module.model.layers.33.self_attn/prim::ListConstruct/Concat_5" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="5813"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="7965" name="__module.model.layers.33.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5814,hidden_states.1005"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7966" name="Constant_301899" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7967" name="__module.model.layers.33.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5818"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7968" name="__module.model.layers.33.self_attn/aten::slice/Reshape_60" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7969" name="ShapeOf_300418" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7970" name="Constant_300419" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7971" name="Constant_300420" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="7972" name="Gather_300421" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7973" name="ShapeOf_300422" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7974" name="Constant_300423" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7975" name="Constant_300424" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="7976" name="Gather_300425" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7977" name="Add_300426" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="5819"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7978" name="__module.model.layers.33.self_attn/aten::slice/Reshape_62" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7979" name="__module.model.layers.33.self_attn/aten::slice/Reshape_63" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7980" name="__module.model.layers.33.self_attn/aten::slice/Slice_15" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="5823"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="7981" name="__module.model.layers.33.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="5824,attn_output.133"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7982" name="__module.model.layers.33.self_attn/aten::transpose/ScatterElementsUpdate_3" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="7983" name="__module.model.layers.33.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5825"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7984" name="Constant_301900" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="798146608" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="7985" name="__module.model.layers.33.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5828"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7986" name="self.model.layers.33.self_attn.o_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="5519024248" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7987" name="Convert_386697" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7988" name="self.model.layers.33.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="5532131448" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7989" name="Convert_386699" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7990" name="self.model.layers.33.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7991" name="self.model.layers.33.self_attn.o_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="5532233848" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="7992" name="self.model.layers.33.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="7993" name="Constant_386704" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="7994" name="Reshape_386705" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7995" name="__module.model.layers.33.self_attn.o_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7996" name="__module.model.layers.33.self_attn.o_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5830,5832,hidden_states.1007"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7997" name="__module.model.layers.33/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5835,5837,5848,hidden_states.1009,hidden_states.1011"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7998" name="Constant_290387" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="5532643448" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="7999" name="Constant_290386" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8000" name="Constant_290384" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8001" name="__module.model.layers.33.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5838"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8002" name="Constant_23300" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="5839"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8003" name="__module.model.layers.33.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5840,variance.135"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8004" name="Constant_290385" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8005" name="__module.model.layers.33.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5841"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8006" name="__module.model.layers.33.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8007" name="__module.model.layers.33.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5842"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8008" name="__module.model.layers.33.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5843,5844,hidden_states.1013,hidden_states.1015"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8009" name="__module.model.layers.33.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5845,5847"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8010" name="self.model.layers.33.mlp.gate_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="5532663928" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8011" name="Convert_385587" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8012" name="self.model.layers.33.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="5568053368" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8013" name="Convert_385589" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8014" name="self.model.layers.33.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8015" name="self.model.layers.33.mlp.gate_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="5568329848" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8016" name="self.model.layers.33.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8017" name="Constant_385594" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8018" name="Reshape_385595" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8019" name="__module.model.layers.33.mlp.gate_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8020" name="__module.model.layers.33.mlp.gate_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5853,input.67"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="8021" name="__module.model.layers.33.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="5854"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="8022" name="self.model.layers.33.mlp.up_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="5569435768" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8023" name="Convert_385577" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8024" name="self.model.layers.33.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="5604825208" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8025" name="Convert_385579" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8026" name="self.model.layers.33.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8027" name="self.model.layers.33.mlp.up_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="5605101688" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8028" name="self.model.layers.33.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8029" name="Constant_385584" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8030" name="Reshape_385585" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8031" name="__module.model.layers.33.mlp.up_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8032" name="__module.model.layers.33.mlp.up_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5856"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="8033" name="__module.model.layers.33.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5857"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="8034" name="self.model.layers.33.mlp.down_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 128" offset="5606207608" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8035" name="Convert_385597" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8036" name="self.model.layers.33.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 1" offset="5641597048" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8037" name="Convert_385599" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8038" name="self.model.layers.33.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8039" name="self.model.layers.33.mlp.down_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 108, 1" offset="5641873528" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8040" name="self.model.layers.33.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8041" name="Constant_385604" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="922101848" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8042" name="Reshape_385605" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="8043" name="__module.model.layers.33.mlp.down_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="8044" name="__module.model.layers.33.mlp.down_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5859,hidden_states.1017"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8045" name="__module.model.layers.33/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5860,5862,5870,5881,hidden_states.1019,hidden_states.1021"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8046" name="Constant_290391" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="5642979448" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8047" name="Constant_290390" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8048" name="Constant_290388" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8049" name="__module.model.layers.34.input_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5871"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8050" name="Constant_23374" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="5872"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8051" name="__module.model.layers.34.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5873,variance.137"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8052" name="Constant_290389" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8053" name="__module.model.layers.34.input_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5874"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8054" name="__module.model.layers.34.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8055" name="__module.model.layers.34.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5875"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8056" name="__module.model.layers.34.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5876,5877,hidden_states.1023,hidden_states.1025"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8057" name="__module.model.layers.34.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5878,5880,hidden_states.1027"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8058" name="self.model.layers.34.self_attn.q_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="5642999928" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8059" name="Convert_386707" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8060" name="self.model.layers.34.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="5656107128" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8061" name="Convert_386709" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8062" name="self.model.layers.34.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8063" name="self.model.layers.34.self_attn.q_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="5656209528" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8064" name="self.model.layers.34.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8065" name="Constant_386714" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8066" name="Reshape_386715" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8067" name="__module.model.layers.34.self_attn.q_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8068" name="__module.model.layers.34.self_attn.q_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8069" name="self.model.layers.34.self_attn.q_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="5120" offset="5656619128" size="10240" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.34.self_attn.q_proj.bias"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8070" name="__module.model.layers.34.self_attn.q_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8071" name="__module.model.layers.34.self_attn.q_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5890,query_states.69"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8072" name="Constant_301901" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="792694336" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8073" name="__module.model.layers.34.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5898"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8074" name="__module.model.layers.34.self_attn/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8075" name="__module.model.layers.34.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5899,q.69"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8076" name="__module.model.layers.34.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5908"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8077" name="__module.model.layers.34.self_attn/aten::size/ShapeOf_3" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8078" name="__module.model.layers.34.self_attn/aten::size/Constant_3" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="8079" name="__module.model.layers.34.self_attn/aten::size/Gather_3" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="5909,5914" /> + </output> + </layer> + <layer id="8080" name="__module.model.layers.34.self_attn/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="8081" name="__module.model.layers.34.self_attn/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="5911,5912,5916,5917" /> + </output> + </layer> + <layer id="8082" name="Constant_221055" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8083" name="__module.model.layers.34.self_attn/aten::slice/Reshape_5" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8084" name="__module.model.layers.34.self_attn/aten::slice/Reshape_1" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8085" name="__module.model.layers.34.self_attn/aten::slice/Reshape_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8086" name="__module.model.layers.34.self_attn/aten::slice/Reshape_3" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8087" name="__module.model.layers.34.self_attn/aten::slice/Slice" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="5918,x2.137"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="8088" name="Constant_290392" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8089" name="__module.model.layers.34.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5919"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="8090" name="__module.model.layers.34.self_attn/aten::slice/Reshape_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8091" name="__module.model.layers.34.self_attn/aten::slice/Reshape_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8092" name="__module.model.layers.34.self_attn/aten::slice/Reshape_7" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8093" name="__module.model.layers.34.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="5913"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="8094" name="__module.model.layers.34.self_attn/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5921"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8095" name="__module.model.layers.34.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5922"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8096" name="__module.model.layers.34.self_attn/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5923"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8097" name="Constant_341659" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="8098" name="Constant_341652" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8099" name="Constant_341654" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8100" name="Constant_341656" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8101" name="Concat_341657" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8102" name="Broadcast_341660" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8103" name="ReadValue_333188" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.34.keypresent.34.key" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.34.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8104" name="Constant_325513" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="8105" name="Gather_325514" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8106" name="self.model.layers.34.self_attn.k_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="5656629368" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8107" name="Convert_387667" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8108" name="self.model.layers.34.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="5659250808" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8109" name="Convert_387669" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8110" name="self.model.layers.34.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8111" name="self.model.layers.34.self_attn.k_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="5659271288" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8112" name="self.model.layers.34.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8113" name="Constant_387674" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8114" name="Reshape_387675" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8115" name="__module.model.layers.34.self_attn.k_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8116" name="__module.model.layers.34.self_attn.k_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="8117" name="self.model.layers.34.self_attn.k_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="5659353208" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.34.self_attn.k_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="8118" name="__module.model.layers.34.self_attn.k_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="8119" name="__module.model.layers.34.self_attn.k_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5893,key_states.141"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="8120" name="Constant_301902" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8121" name="__module.model.layers.34.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5901"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8122" name="__module.model.layers.34.self_attn/aten::transpose/ScatterElementsUpdate_1" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8123" name="__module.model.layers.34.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5902,k.69"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8124" name="__module.model.layers.34.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5924"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8125" name="__module.model.layers.34.self_attn/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8126" name="__module.model.layers.34.self_attn/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="8127" name="__module.model.layers.34.self_attn/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="5925,5930" /> + </output> + </layer> + <layer id="8128" name="__module.model.layers.34.self_attn/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="8129" name="__module.model.layers.34.self_attn/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="5927,5928,5932,5933" /> + </output> + </layer> + <layer id="8130" name="Constant_221056" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8131" name="__module.model.layers.34.self_attn/aten::slice/Reshape_13" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8132" name="__module.model.layers.34.self_attn/aten::slice/Reshape_9" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8133" name="__module.model.layers.34.self_attn/aten::slice/Reshape_10" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8134" name="__module.model.layers.34.self_attn/aten::slice/Reshape_11" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8135" name="__module.model.layers.34.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="5934,x2.139"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="8136" name="Constant_290393" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8137" name="__module.model.layers.34.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5935"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="8138" name="__module.model.layers.34.self_attn/aten::slice/Reshape_12" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8139" name="__module.model.layers.34.self_attn/aten::slice/Reshape_14" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8140" name="__module.model.layers.34.self_attn/aten::slice/Reshape_15" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8141" name="__module.model.layers.34.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="5929"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="8142" name="__module.model.layers.34.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5937"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8143" name="__module.model.layers.34.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5938"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8144" name="__module.model.layers.34.self_attn/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5939"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8145" name="__module.model.layers.34.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.34.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8146" name="__module.model.layers.34.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="5951,5952,5953"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8147" name="__module.model.layers.34.self_attn/aten::size/ShapeOf_6" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8148" name="Constant_302534" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="938477672" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8149" name="Constant_302535" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="8150" name="Gather_302536" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8151" name="Constant_269058" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8152" name="Constant_277381" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8153" name="Constant_277382" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="8154" name="Gather_277383" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8155" name="__module.model.layers.34.self_attn/prim::ListConstruct/Concat_2" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="3" precision="I64" names="5954"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="8156" name="__module.model.layers.34.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5955,hidden_states.1031"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8157" name="Constant_301903" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8158" name="__module.model.layers.34.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5959,key_states.143"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8159" name="Constant_341672" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="8160" name="Constant_341665" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8161" name="Constant_341667" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8162" name="Constant_341669" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8163" name="Concat_341670" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8164" name="Broadcast_341673" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8165" name="ReadValue_333190" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.34.valuepresent.34.value" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.34.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8166" name="Constant_325516" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="8167" name="Gather_325517" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8168" name="self.model.layers.34.self_attn.v_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="5659355256" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8169" name="Convert_387677" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8170" name="self.model.layers.34.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="5661976696" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8171" name="Convert_387679" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8172" name="self.model.layers.34.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8173" name="self.model.layers.34.self_attn.v_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="5661997176" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8174" name="self.model.layers.34.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8175" name="Constant_387684" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8176" name="Reshape_387685" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8177" name="__module.model.layers.34.self_attn.v_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8178" name="__module.model.layers.34.self_attn.v_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="8179" name="self.model.layers.34.self_attn.v_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="5662079096" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.34.self_attn.v_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="8180" name="__module.model.layers.34.self_attn.v_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="8181" name="__module.model.layers.34.self_attn.v_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5896,value_states.69"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="8182" name="Constant_301904" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8183" name="__module.model.layers.34.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5904"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8184" name="__module.model.layers.34.self_attn/aten::transpose/ScatterElementsUpdate_2" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8185" name="__module.model.layers.34.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5905"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8186" name="__module.model.layers.34.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.34.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8187" name="__module.model.layers.34.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="5967,5968,5969"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8188" name="__module.model.layers.34.self_attn/aten::size/ShapeOf_10" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8189" name="Constant_302289" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8190" name="__module.model.layers.34.self_attn/aten::size/Constant_11" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="8191" name="__module.model.layers.34.self_attn/aten::size/Gather_11" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="5961"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8192" name="Constant_269076" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8193" name="Constant_277391" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8194" name="Constant_277392" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="8195" name="Gather_277393" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8196" name="__module.model.layers.34.self_attn/prim::ListConstruct/Concat_5" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="5970"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="8197" name="__module.model.layers.34.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5971,hidden_states.1035"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8198" name="Constant_301905" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8199" name="__module.model.layers.34.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5975"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8200" name="__module.model.layers.34.self_attn/aten::slice/Reshape_60" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8201" name="ShapeOf_300504" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8202" name="Constant_300505" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8203" name="Constant_300506" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="8204" name="Gather_300507" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8205" name="ShapeOf_300508" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8206" name="Constant_300509" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8207" name="Constant_300510" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="8208" name="Gather_300511" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8209" name="Add_300512" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="5976"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8210" name="__module.model.layers.34.self_attn/aten::slice/Reshape_62" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8211" name="__module.model.layers.34.self_attn/aten::slice/Reshape_63" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8212" name="__module.model.layers.34.self_attn/aten::slice/Slice_15" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="5980"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="8213" name="__module.model.layers.34.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="5981,attn_output.137"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8214" name="__module.model.layers.34.self_attn/aten::transpose/ScatterElementsUpdate_3" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8215" name="__module.model.layers.34.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5982"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8216" name="Constant_301906" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="798146608" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="8217" name="__module.model.layers.34.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5985"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8218" name="self.model.layers.34.self_attn.o_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="5662081144" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8219" name="Convert_386717" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8220" name="self.model.layers.34.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="5675188344" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8221" name="Convert_386719" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8222" name="self.model.layers.34.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8223" name="self.model.layers.34.self_attn.o_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="5675290744" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8224" name="self.model.layers.34.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8225" name="Constant_386724" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8226" name="Reshape_386725" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8227" name="__module.model.layers.34.self_attn.o_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8228" name="__module.model.layers.34.self_attn.o_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5987,5989,hidden_states.1037"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8229" name="__module.model.layers.34/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5992,5994,6005,hidden_states.1039,hidden_states.1041"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8230" name="Constant_290397" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="5675700344" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8231" name="Constant_290396" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8232" name="Constant_290394" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8233" name="__module.model.layers.34.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5995"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8234" name="Constant_23972" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="5996"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8235" name="__module.model.layers.34.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5997,variance.139"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8236" name="Constant_290395" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8237" name="__module.model.layers.34.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5998"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8238" name="__module.model.layers.34.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8239" name="__module.model.layers.34.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="5999"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8240" name="__module.model.layers.34.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6000,6001,hidden_states.1043,hidden_states.1045"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8241" name="__module.model.layers.34.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6002,6004"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8242" name="self.model.layers.34.mlp.gate_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="5675720824" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8243" name="Convert_385617" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8244" name="self.model.layers.34.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="5711110264" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8245" name="Convert_385619" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8246" name="self.model.layers.34.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8247" name="self.model.layers.34.mlp.gate_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="5711386744" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8248" name="self.model.layers.34.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8249" name="Constant_385624" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8250" name="Reshape_385625" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8251" name="__module.model.layers.34.mlp.gate_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8252" name="__module.model.layers.34.mlp.gate_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6010,input.69"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="8253" name="__module.model.layers.34.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="6011"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="8254" name="self.model.layers.34.mlp.up_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="5712492664" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8255" name="Convert_385607" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8256" name="self.model.layers.34.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="5747882104" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8257" name="Convert_385609" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8258" name="self.model.layers.34.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8259" name="self.model.layers.34.mlp.up_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="5748158584" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8260" name="self.model.layers.34.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8261" name="Constant_385614" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8262" name="Reshape_385615" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8263" name="__module.model.layers.34.mlp.up_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8264" name="__module.model.layers.34.mlp.up_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6013"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="8265" name="__module.model.layers.34.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6014"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="8266" name="self.model.layers.34.mlp.down_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 128" offset="5749264504" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8267" name="Convert_385627" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8268" name="self.model.layers.34.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 1" offset="5784653944" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8269" name="Convert_385629" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8270" name="self.model.layers.34.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8271" name="self.model.layers.34.mlp.down_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 108, 1" offset="5784930424" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8272" name="self.model.layers.34.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8273" name="Constant_385634" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="922101848" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8274" name="Reshape_385635" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="8275" name="__module.model.layers.34.mlp.down_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="8276" name="__module.model.layers.34.mlp.down_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6016,hidden_states.1047"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8277" name="__module.model.layers.34/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6017,6019,6027,6038,hidden_states.1049,hidden_states.1051"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8278" name="Constant_290401" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="5786036344" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8279" name="Constant_290400" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8280" name="Constant_290398" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8281" name="__module.model.layers.35.input_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6028"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8282" name="Constant_24046" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="6029"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8283" name="__module.model.layers.35.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6030,variance.141"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8284" name="Constant_290399" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8285" name="__module.model.layers.35.input_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6031"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8286" name="__module.model.layers.35.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8287" name="__module.model.layers.35.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6032"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8288" name="__module.model.layers.35.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6033,6034,hidden_states.1053,hidden_states.1055"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8289" name="__module.model.layers.35.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6035,6037,hidden_states.1057"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8290" name="self.model.layers.35.self_attn.q_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="5786056824" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8291" name="Convert_386727" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8292" name="self.model.layers.35.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="5799164024" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8293" name="Convert_386729" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8294" name="self.model.layers.35.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8295" name="self.model.layers.35.self_attn.q_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="5799266424" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8296" name="self.model.layers.35.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8297" name="Constant_386734" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8298" name="Reshape_386735" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8299" name="__module.model.layers.35.self_attn.q_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8300" name="__module.model.layers.35.self_attn.q_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8301" name="self.model.layers.35.self_attn.q_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="5120" offset="5799676024" size="10240" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.35.self_attn.q_proj.bias"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8302" name="__module.model.layers.35.self_attn.q_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8303" name="__module.model.layers.35.self_attn.q_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6047,query_states.71"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8304" name="Constant_301907" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="792694336" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8305" name="__module.model.layers.35.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6055"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8306" name="__module.model.layers.35.self_attn/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8307" name="__module.model.layers.35.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6056,q.71"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8308" name="__module.model.layers.35.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6065"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8309" name="__module.model.layers.35.self_attn/aten::size/ShapeOf_3" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8310" name="__module.model.layers.35.self_attn/aten::size/Constant_3" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="8311" name="__module.model.layers.35.self_attn/aten::size/Gather_3" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="6066,6071" /> + </output> + </layer> + <layer id="8312" name="__module.model.layers.35.self_attn/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="8313" name="__module.model.layers.35.self_attn/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="6068,6069,6073,6074" /> + </output> + </layer> + <layer id="8314" name="Constant_221070" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8315" name="__module.model.layers.35.self_attn/aten::slice/Reshape_5" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8316" name="__module.model.layers.35.self_attn/aten::slice/Reshape_1" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8317" name="__module.model.layers.35.self_attn/aten::slice/Reshape_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8318" name="__module.model.layers.35.self_attn/aten::slice/Reshape_3" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8319" name="__module.model.layers.35.self_attn/aten::slice/Slice" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="6075,x2.141"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="8320" name="Constant_290402" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8321" name="__module.model.layers.35.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6076"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="8322" name="__module.model.layers.35.self_attn/aten::slice/Reshape_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8323" name="__module.model.layers.35.self_attn/aten::slice/Reshape_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8324" name="__module.model.layers.35.self_attn/aten::slice/Reshape_7" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8325" name="__module.model.layers.35.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="6070"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="8326" name="__module.model.layers.35.self_attn/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6078"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8327" name="__module.model.layers.35.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6079"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8328" name="__module.model.layers.35.self_attn/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6080"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8329" name="Constant_341685" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="8330" name="Constant_341678" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8331" name="Constant_341680" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8332" name="Constant_341682" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8333" name="Concat_341683" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8334" name="Broadcast_341686" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8335" name="ReadValue_333192" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.35.keypresent.35.key" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.35.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8336" name="Constant_325519" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="8337" name="Gather_325520" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8338" name="self.model.layers.35.self_attn.k_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="5799686264" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8339" name="Convert_387687" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8340" name="self.model.layers.35.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="5802307704" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8341" name="Convert_387689" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8342" name="self.model.layers.35.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8343" name="self.model.layers.35.self_attn.k_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="5802328184" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8344" name="self.model.layers.35.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8345" name="Constant_387694" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8346" name="Reshape_387695" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8347" name="__module.model.layers.35.self_attn.k_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8348" name="__module.model.layers.35.self_attn.k_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="8349" name="self.model.layers.35.self_attn.k_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="5802410104" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.35.self_attn.k_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="8350" name="__module.model.layers.35.self_attn.k_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="8351" name="__module.model.layers.35.self_attn.k_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6050,key_states.145"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="8352" name="Constant_301908" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8353" name="__module.model.layers.35.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6058"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8354" name="__module.model.layers.35.self_attn/aten::transpose/ScatterElementsUpdate_1" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8355" name="__module.model.layers.35.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6059,k.71"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8356" name="__module.model.layers.35.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6081"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8357" name="__module.model.layers.35.self_attn/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8358" name="__module.model.layers.35.self_attn/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="8359" name="__module.model.layers.35.self_attn/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="6082,6087" /> + </output> + </layer> + <layer id="8360" name="__module.model.layers.35.self_attn/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="8361" name="__module.model.layers.35.self_attn/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="6084,6085,6089,6090" /> + </output> + </layer> + <layer id="8362" name="Constant_221071" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8363" name="__module.model.layers.35.self_attn/aten::slice/Reshape_13" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8364" name="__module.model.layers.35.self_attn/aten::slice/Reshape_9" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8365" name="__module.model.layers.35.self_attn/aten::slice/Reshape_10" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8366" name="__module.model.layers.35.self_attn/aten::slice/Reshape_11" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8367" name="__module.model.layers.35.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="6091,x2.143"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="8368" name="Constant_290403" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8369" name="__module.model.layers.35.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6092"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="8370" name="__module.model.layers.35.self_attn/aten::slice/Reshape_12" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8371" name="__module.model.layers.35.self_attn/aten::slice/Reshape_14" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8372" name="__module.model.layers.35.self_attn/aten::slice/Reshape_15" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8373" name="__module.model.layers.35.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="6086"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="8374" name="__module.model.layers.35.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6094"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8375" name="__module.model.layers.35.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6095"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8376" name="__module.model.layers.35.self_attn/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6096"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8377" name="__module.model.layers.35.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.35.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8378" name="__module.model.layers.35.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="6108,6109,6110"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8379" name="__module.model.layers.35.self_attn/aten::size/ShapeOf_6" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8380" name="Constant_302539" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="938477672" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8381" name="Constant_302540" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="8382" name="Gather_302541" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8383" name="Constant_269094" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8384" name="Constant_277416" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8385" name="Constant_277417" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="8386" name="Gather_277418" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8387" name="__module.model.layers.35.self_attn/prim::ListConstruct/Concat_2" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="3" precision="I64" names="6111"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="8388" name="__module.model.layers.35.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6112,hidden_states.1061"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8389" name="Constant_301909" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8390" name="__module.model.layers.35.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6116,key_states.147"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8391" name="Constant_341698" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="8392" name="Constant_341691" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8393" name="Constant_341693" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8394" name="Constant_341695" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8395" name="Concat_341696" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8396" name="Broadcast_341699" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8397" name="ReadValue_333194" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.35.valuepresent.35.value" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.35.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8398" name="Constant_325522" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="8399" name="Gather_325523" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8400" name="self.model.layers.35.self_attn.v_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="5802412152" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8401" name="Convert_387697" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8402" name="self.model.layers.35.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="5805033592" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8403" name="Convert_387699" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8404" name="self.model.layers.35.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8405" name="self.model.layers.35.self_attn.v_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="5805054072" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8406" name="self.model.layers.35.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8407" name="Constant_387704" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8408" name="Reshape_387705" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8409" name="__module.model.layers.35.self_attn.v_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8410" name="__module.model.layers.35.self_attn.v_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="8411" name="self.model.layers.35.self_attn.v_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="5805135992" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.35.self_attn.v_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="8412" name="__module.model.layers.35.self_attn.v_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="8413" name="__module.model.layers.35.self_attn.v_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6053,value_states.71"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="8414" name="Constant_301910" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8415" name="__module.model.layers.35.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6061"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8416" name="__module.model.layers.35.self_attn/aten::transpose/ScatterElementsUpdate_2" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8417" name="__module.model.layers.35.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6062"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8418" name="__module.model.layers.35.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.35.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8419" name="__module.model.layers.35.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="6124,6125,6126"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8420" name="__module.model.layers.35.self_attn/aten::size/ShapeOf_10" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8421" name="Constant_302295" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8422" name="__module.model.layers.35.self_attn/aten::size/Constant_11" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="8423" name="__module.model.layers.35.self_attn/aten::size/Gather_11" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="6118"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8424" name="Constant_269112" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8425" name="Constant_277426" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8426" name="Constant_277427" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="8427" name="Gather_277428" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8428" name="__module.model.layers.35.self_attn/prim::ListConstruct/Concat_5" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="6127"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="8429" name="__module.model.layers.35.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6128,hidden_states.1065"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8430" name="Constant_301911" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8431" name="__module.model.layers.35.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6132"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8432" name="__module.model.layers.35.self_attn/aten::slice/Reshape_60" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8433" name="ShapeOf_300590" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8434" name="Constant_300591" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8435" name="Constant_300592" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="8436" name="Gather_300593" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8437" name="ShapeOf_300594" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8438" name="Constant_300595" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8439" name="Constant_300596" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="8440" name="Gather_300597" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8441" name="Add_300598" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="6133"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8442" name="__module.model.layers.35.self_attn/aten::slice/Reshape_62" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8443" name="__module.model.layers.35.self_attn/aten::slice/Reshape_63" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8444" name="__module.model.layers.35.self_attn/aten::slice/Slice_15" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="6137"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="8445" name="__module.model.layers.35.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="6138,attn_output.141"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8446" name="__module.model.layers.35.self_attn/aten::transpose/ScatterElementsUpdate_3" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8447" name="__module.model.layers.35.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6139"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8448" name="Constant_301912" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="798146608" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="8449" name="__module.model.layers.35.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6142"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8450" name="self.model.layers.35.self_attn.o_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="5805138040" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8451" name="Convert_386737" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8452" name="self.model.layers.35.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="5818245240" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8453" name="Convert_386739" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8454" name="self.model.layers.35.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8455" name="self.model.layers.35.self_attn.o_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="5818347640" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8456" name="self.model.layers.35.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8457" name="Constant_386744" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8458" name="Reshape_386745" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8459" name="__module.model.layers.35.self_attn.o_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8460" name="__module.model.layers.35.self_attn.o_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6144,6146,hidden_states.1067"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8461" name="__module.model.layers.35/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6149,6151,6162,hidden_states.1069,hidden_states.1071"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8462" name="Constant_290407" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="5818757240" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8463" name="Constant_290406" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8464" name="Constant_290404" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8465" name="__module.model.layers.35.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6152"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8466" name="Constant_24644" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="6153"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8467" name="__module.model.layers.35.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6154,variance.143"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8468" name="Constant_290405" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8469" name="__module.model.layers.35.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6155"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8470" name="__module.model.layers.35.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8471" name="__module.model.layers.35.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6156"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8472" name="__module.model.layers.35.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6157,6158,hidden_states.1073,hidden_states.1075"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8473" name="__module.model.layers.35.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6159,6161"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8474" name="self.model.layers.35.mlp.gate_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="5818777720" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8475" name="Convert_385647" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8476" name="self.model.layers.35.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="5854167160" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8477" name="Convert_385649" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8478" name="self.model.layers.35.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8479" name="self.model.layers.35.mlp.gate_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="5854443640" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8480" name="self.model.layers.35.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8481" name="Constant_385654" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8482" name="Reshape_385655" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8483" name="__module.model.layers.35.mlp.gate_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8484" name="__module.model.layers.35.mlp.gate_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6167,input.71"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="8485" name="__module.model.layers.35.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="6168"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="8486" name="self.model.layers.35.mlp.up_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="5855549560" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8487" name="Convert_385637" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8488" name="self.model.layers.35.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="5890939000" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8489" name="Convert_385639" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8490" name="self.model.layers.35.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8491" name="self.model.layers.35.mlp.up_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="5891215480" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8492" name="self.model.layers.35.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8493" name="Constant_385644" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8494" name="Reshape_385645" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8495" name="__module.model.layers.35.mlp.up_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8496" name="__module.model.layers.35.mlp.up_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6170"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="8497" name="__module.model.layers.35.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6171"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="8498" name="self.model.layers.35.mlp.down_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 128" offset="5892321400" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8499" name="Convert_385657" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8500" name="self.model.layers.35.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 1" offset="5927710840" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8501" name="Convert_385659" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8502" name="self.model.layers.35.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8503" name="self.model.layers.35.mlp.down_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 108, 1" offset="5927987320" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8504" name="self.model.layers.35.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8505" name="Constant_385664" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="922101848" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8506" name="Reshape_385665" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="8507" name="__module.model.layers.35.mlp.down_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="8508" name="__module.model.layers.35.mlp.down_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6173,hidden_states.1077"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8509" name="__module.model.layers.35/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6174,6176,6184,6195,hidden_states.1079,hidden_states.1081"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8510" name="Constant_290411" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="5929093240" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8511" name="Constant_290410" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8512" name="Constant_290408" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8513" name="__module.model.layers.36.input_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6185"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8514" name="Constant_24718" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="6186"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8515" name="__module.model.layers.36.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6187,variance.145"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8516" name="Constant_290409" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8517" name="__module.model.layers.36.input_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6188"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8518" name="__module.model.layers.36.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8519" name="__module.model.layers.36.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6189"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8520" name="__module.model.layers.36.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6190,6191,hidden_states.1083,hidden_states.1085"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8521" name="__module.model.layers.36.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6192,6194,hidden_states.1087"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8522" name="self.model.layers.36.self_attn.q_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="5929113720" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8523" name="Convert_386747" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8524" name="self.model.layers.36.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="5942220920" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8525" name="Convert_386749" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8526" name="self.model.layers.36.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8527" name="self.model.layers.36.self_attn.q_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="5942323320" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8528" name="self.model.layers.36.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8529" name="Constant_386754" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8530" name="Reshape_386755" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8531" name="__module.model.layers.36.self_attn.q_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8532" name="__module.model.layers.36.self_attn.q_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8533" name="self.model.layers.36.self_attn.q_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="5120" offset="5942732920" size="10240" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.36.self_attn.q_proj.bias"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8534" name="__module.model.layers.36.self_attn.q_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8535" name="__module.model.layers.36.self_attn.q_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6204,query_states.73"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8536" name="Constant_301913" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="792694336" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8537" name="__module.model.layers.36.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6212"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8538" name="__module.model.layers.36.self_attn/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8539" name="__module.model.layers.36.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6213,q.73"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8540" name="__module.model.layers.36.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6222"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8541" name="__module.model.layers.36.self_attn/aten::size/ShapeOf_3" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8542" name="__module.model.layers.36.self_attn/aten::size/Constant_3" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="8543" name="__module.model.layers.36.self_attn/aten::size/Gather_3" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="6223,6228" /> + </output> + </layer> + <layer id="8544" name="__module.model.layers.36.self_attn/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="8545" name="__module.model.layers.36.self_attn/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="6225,6226,6230,6231" /> + </output> + </layer> + <layer id="8546" name="Constant_221085" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8547" name="__module.model.layers.36.self_attn/aten::slice/Reshape_5" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8548" name="__module.model.layers.36.self_attn/aten::slice/Reshape_1" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8549" name="__module.model.layers.36.self_attn/aten::slice/Reshape_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8550" name="__module.model.layers.36.self_attn/aten::slice/Reshape_3" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8551" name="__module.model.layers.36.self_attn/aten::slice/Slice" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="6232,x2.145"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="8552" name="Constant_290412" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8553" name="__module.model.layers.36.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6233"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="8554" name="__module.model.layers.36.self_attn/aten::slice/Reshape_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8555" name="__module.model.layers.36.self_attn/aten::slice/Reshape_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8556" name="__module.model.layers.36.self_attn/aten::slice/Reshape_7" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8557" name="__module.model.layers.36.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="6227"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="8558" name="__module.model.layers.36.self_attn/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6235"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8559" name="__module.model.layers.36.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6236"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8560" name="__module.model.layers.36.self_attn/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6237"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8561" name="Constant_341711" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="8562" name="Constant_341704" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8563" name="Constant_341706" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8564" name="Constant_341708" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8565" name="Concat_341709" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8566" name="Broadcast_341712" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8567" name="ReadValue_333196" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.36.keypresent.36.key" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.36.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8568" name="Constant_325525" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="8569" name="Gather_325526" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8570" name="self.model.layers.36.self_attn.k_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="5942743160" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8571" name="Convert_387707" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8572" name="self.model.layers.36.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="5945364600" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8573" name="Convert_387709" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8574" name="self.model.layers.36.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8575" name="self.model.layers.36.self_attn.k_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="5945385080" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8576" name="self.model.layers.36.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8577" name="Constant_387714" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8578" name="Reshape_387715" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8579" name="__module.model.layers.36.self_attn.k_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8580" name="__module.model.layers.36.self_attn.k_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="8581" name="self.model.layers.36.self_attn.k_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="5945467000" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.36.self_attn.k_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="8582" name="__module.model.layers.36.self_attn.k_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="8583" name="__module.model.layers.36.self_attn.k_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6207,key_states.149"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="8584" name="Constant_301914" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8585" name="__module.model.layers.36.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6215"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8586" name="__module.model.layers.36.self_attn/aten::transpose/ScatterElementsUpdate_1" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8587" name="__module.model.layers.36.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6216,k.73"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8588" name="__module.model.layers.36.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6238"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8589" name="__module.model.layers.36.self_attn/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8590" name="__module.model.layers.36.self_attn/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="8591" name="__module.model.layers.36.self_attn/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="6239,6244" /> + </output> + </layer> + <layer id="8592" name="__module.model.layers.36.self_attn/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="8593" name="__module.model.layers.36.self_attn/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="6241,6242,6246,6247" /> + </output> + </layer> + <layer id="8594" name="Constant_221086" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8595" name="__module.model.layers.36.self_attn/aten::slice/Reshape_13" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8596" name="__module.model.layers.36.self_attn/aten::slice/Reshape_9" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8597" name="__module.model.layers.36.self_attn/aten::slice/Reshape_10" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8598" name="__module.model.layers.36.self_attn/aten::slice/Reshape_11" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8599" name="__module.model.layers.36.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="6248,x2.147"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="8600" name="Constant_290413" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8601" name="__module.model.layers.36.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6249"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="8602" name="__module.model.layers.36.self_attn/aten::slice/Reshape_12" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8603" name="__module.model.layers.36.self_attn/aten::slice/Reshape_14" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8604" name="__module.model.layers.36.self_attn/aten::slice/Reshape_15" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8605" name="__module.model.layers.36.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="6243"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="8606" name="__module.model.layers.36.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6251"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8607" name="__module.model.layers.36.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6252"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8608" name="__module.model.layers.36.self_attn/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6253"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8609" name="__module.model.layers.36.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.36.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8610" name="__module.model.layers.36.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="6265,6266,6267"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8611" name="__module.model.layers.36.self_attn/aten::size/ShapeOf_6" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8612" name="Constant_302544" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="938477672" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8613" name="Constant_302545" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="8614" name="Gather_302546" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8615" name="Constant_269130" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8616" name="Constant_277451" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8617" name="Constant_277452" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="8618" name="Gather_277453" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8619" name="__module.model.layers.36.self_attn/prim::ListConstruct/Concat_2" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="3" precision="I64" names="6268"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="8620" name="__module.model.layers.36.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6269,hidden_states.1091"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8621" name="Constant_301915" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8622" name="__module.model.layers.36.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6273,key_states.151"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8623" name="Constant_341724" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="8624" name="Constant_341717" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8625" name="Constant_341719" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8626" name="Constant_341721" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8627" name="Concat_341722" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8628" name="Broadcast_341725" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8629" name="ReadValue_333198" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.36.valuepresent.36.value" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.36.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8630" name="Constant_325528" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="8631" name="Gather_325529" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8632" name="self.model.layers.36.self_attn.v_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="5945469048" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8633" name="Convert_387717" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8634" name="self.model.layers.36.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="5948090488" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8635" name="Convert_387719" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8636" name="self.model.layers.36.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8637" name="self.model.layers.36.self_attn.v_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="5948110968" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8638" name="self.model.layers.36.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8639" name="Constant_387724" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8640" name="Reshape_387725" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8641" name="__module.model.layers.36.self_attn.v_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8642" name="__module.model.layers.36.self_attn.v_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="8643" name="self.model.layers.36.self_attn.v_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="5948192888" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.36.self_attn.v_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="8644" name="__module.model.layers.36.self_attn.v_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="8645" name="__module.model.layers.36.self_attn.v_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6210,value_states.73"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="8646" name="Constant_301916" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8647" name="__module.model.layers.36.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6218"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8648" name="__module.model.layers.36.self_attn/aten::transpose/ScatterElementsUpdate_2" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8649" name="__module.model.layers.36.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6219"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8650" name="__module.model.layers.36.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.36.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8651" name="__module.model.layers.36.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="6281,6282,6283"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8652" name="__module.model.layers.36.self_attn/aten::size/ShapeOf_10" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8653" name="Constant_302301" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8654" name="__module.model.layers.36.self_attn/aten::size/Constant_11" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="8655" name="__module.model.layers.36.self_attn/aten::size/Gather_11" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="6275"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8656" name="Constant_269148" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8657" name="Constant_277461" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8658" name="Constant_277462" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="8659" name="Gather_277463" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8660" name="__module.model.layers.36.self_attn/prim::ListConstruct/Concat_5" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="6284"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="8661" name="__module.model.layers.36.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6285,hidden_states.1095"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8662" name="Constant_301917" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8663" name="__module.model.layers.36.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6289"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8664" name="__module.model.layers.36.self_attn/aten::slice/Reshape_60" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8665" name="ShapeOf_300676" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8666" name="Constant_300677" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8667" name="Constant_300678" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="8668" name="Gather_300679" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8669" name="ShapeOf_300680" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8670" name="Constant_300681" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8671" name="Constant_300682" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="8672" name="Gather_300683" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8673" name="Add_300684" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="6290"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8674" name="__module.model.layers.36.self_attn/aten::slice/Reshape_62" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8675" name="__module.model.layers.36.self_attn/aten::slice/Reshape_63" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8676" name="__module.model.layers.36.self_attn/aten::slice/Slice_15" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="6294"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="8677" name="__module.model.layers.36.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="6295,attn_output.145"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8678" name="__module.model.layers.36.self_attn/aten::transpose/ScatterElementsUpdate_3" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8679" name="__module.model.layers.36.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6296"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8680" name="Constant_301918" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="798146608" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="8681" name="__module.model.layers.36.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6299"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8682" name="self.model.layers.36.self_attn.o_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="5948194936" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8683" name="Convert_386757" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8684" name="self.model.layers.36.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="5961302136" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8685" name="Convert_386759" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8686" name="self.model.layers.36.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8687" name="self.model.layers.36.self_attn.o_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="5961404536" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8688" name="self.model.layers.36.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8689" name="Constant_386764" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8690" name="Reshape_386765" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8691" name="__module.model.layers.36.self_attn.o_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8692" name="__module.model.layers.36.self_attn.o_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6301,6303,hidden_states.1097"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8693" name="__module.model.layers.36/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6306,6308,6319,hidden_states.1099,hidden_states.1101"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8694" name="Constant_290417" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="5961814136" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8695" name="Constant_290416" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8696" name="Constant_290414" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8697" name="__module.model.layers.36.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6309"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8698" name="Constant_25316" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="6310"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8699" name="__module.model.layers.36.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6311,variance.147"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8700" name="Constant_290415" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8701" name="__module.model.layers.36.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6312"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8702" name="__module.model.layers.36.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8703" name="__module.model.layers.36.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6313"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8704" name="__module.model.layers.36.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6314,6315,hidden_states.1103,hidden_states.1105"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8705" name="__module.model.layers.36.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6316,6318"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8706" name="self.model.layers.36.mlp.gate_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="5961834616" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8707" name="Convert_385677" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8708" name="self.model.layers.36.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="5997224056" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8709" name="Convert_385679" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8710" name="self.model.layers.36.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8711" name="self.model.layers.36.mlp.gate_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="5997500536" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8712" name="self.model.layers.36.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8713" name="Constant_385684" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8714" name="Reshape_385685" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8715" name="__module.model.layers.36.mlp.gate_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8716" name="__module.model.layers.36.mlp.gate_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6324,input.73"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="8717" name="__module.model.layers.36.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="6325"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="8718" name="self.model.layers.36.mlp.up_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="5998606456" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8719" name="Convert_385667" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8720" name="self.model.layers.36.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="6033995896" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8721" name="Convert_385669" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8722" name="self.model.layers.36.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8723" name="self.model.layers.36.mlp.up_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="6034272376" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8724" name="self.model.layers.36.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8725" name="Constant_385674" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8726" name="Reshape_385675" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8727" name="__module.model.layers.36.mlp.up_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8728" name="__module.model.layers.36.mlp.up_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6327"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="8729" name="__module.model.layers.36.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6328"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="8730" name="self.model.layers.36.mlp.down_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 128" offset="6035378296" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8731" name="Convert_385687" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8732" name="self.model.layers.36.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 1" offset="6070767736" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8733" name="Convert_385689" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8734" name="self.model.layers.36.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8735" name="self.model.layers.36.mlp.down_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 108, 1" offset="6071044216" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8736" name="self.model.layers.36.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8737" name="Constant_385694" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="922101848" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8738" name="Reshape_385695" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="8739" name="__module.model.layers.36.mlp.down_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="8740" name="__module.model.layers.36.mlp.down_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6330,hidden_states.1107"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8741" name="__module.model.layers.36/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6331,6333,6341,6352,hidden_states.1109,hidden_states.1111"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8742" name="Constant_290421" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="6072150136" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8743" name="Constant_290420" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8744" name="Constant_290418" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8745" name="__module.model.layers.37.input_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6342"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8746" name="Constant_25390" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="6343"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8747" name="__module.model.layers.37.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6344,variance.149"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8748" name="Constant_290419" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8749" name="__module.model.layers.37.input_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6345"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8750" name="__module.model.layers.37.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8751" name="__module.model.layers.37.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6346"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8752" name="__module.model.layers.37.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6347,6348,hidden_states.1113,hidden_states.1115"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8753" name="__module.model.layers.37.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6349,6351,hidden_states.1117"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8754" name="self.model.layers.37.self_attn.q_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="6072170616" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8755" name="Convert_386767" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8756" name="self.model.layers.37.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="6085277816" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8757" name="Convert_386769" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8758" name="self.model.layers.37.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8759" name="self.model.layers.37.self_attn.q_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="6085380216" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8760" name="self.model.layers.37.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8761" name="Constant_386774" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8762" name="Reshape_386775" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8763" name="__module.model.layers.37.self_attn.q_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8764" name="__module.model.layers.37.self_attn.q_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8765" name="self.model.layers.37.self_attn.q_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="5120" offset="6085789816" size="10240" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.37.self_attn.q_proj.bias"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8766" name="__module.model.layers.37.self_attn.q_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8767" name="__module.model.layers.37.self_attn.q_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6361,query_states.75"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8768" name="Constant_301919" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="792694336" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8769" name="__module.model.layers.37.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6369"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8770" name="__module.model.layers.37.self_attn/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8771" name="__module.model.layers.37.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6370,q.75"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8772" name="__module.model.layers.37.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6379"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8773" name="__module.model.layers.37.self_attn/aten::size/ShapeOf_3" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8774" name="__module.model.layers.37.self_attn/aten::size/Constant_3" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="8775" name="__module.model.layers.37.self_attn/aten::size/Gather_3" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="6380,6385" /> + </output> + </layer> + <layer id="8776" name="__module.model.layers.37.self_attn/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="8777" name="__module.model.layers.37.self_attn/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="6382,6383,6387,6388" /> + </output> + </layer> + <layer id="8778" name="Constant_221100" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8779" name="__module.model.layers.37.self_attn/aten::slice/Reshape_5" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8780" name="__module.model.layers.37.self_attn/aten::slice/Reshape_1" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8781" name="__module.model.layers.37.self_attn/aten::slice/Reshape_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8782" name="__module.model.layers.37.self_attn/aten::slice/Reshape_3" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8783" name="__module.model.layers.37.self_attn/aten::slice/Slice" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="6389,x2.149"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="8784" name="Constant_290422" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8785" name="__module.model.layers.37.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6390"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="8786" name="__module.model.layers.37.self_attn/aten::slice/Reshape_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8787" name="__module.model.layers.37.self_attn/aten::slice/Reshape_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8788" name="__module.model.layers.37.self_attn/aten::slice/Reshape_7" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8789" name="__module.model.layers.37.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="6384"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="8790" name="__module.model.layers.37.self_attn/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6392"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8791" name="__module.model.layers.37.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6393"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8792" name="__module.model.layers.37.self_attn/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6394"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8793" name="Constant_341737" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="8794" name="Constant_341730" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8795" name="Constant_341732" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8796" name="Constant_341734" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8797" name="Concat_341735" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8798" name="Broadcast_341738" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8799" name="ReadValue_333200" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.37.keypresent.37.key" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.37.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8800" name="Constant_325531" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="8801" name="Gather_325532" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8802" name="self.model.layers.37.self_attn.k_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="6085800056" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8803" name="Convert_387727" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8804" name="self.model.layers.37.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="6088421496" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8805" name="Convert_387729" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8806" name="self.model.layers.37.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8807" name="self.model.layers.37.self_attn.k_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="6088441976" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8808" name="self.model.layers.37.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8809" name="Constant_387734" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8810" name="Reshape_387735" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8811" name="__module.model.layers.37.self_attn.k_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8812" name="__module.model.layers.37.self_attn.k_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="8813" name="self.model.layers.37.self_attn.k_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="6088523896" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.37.self_attn.k_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="8814" name="__module.model.layers.37.self_attn.k_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="8815" name="__module.model.layers.37.self_attn.k_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6364,key_states.153"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="8816" name="Constant_301920" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8817" name="__module.model.layers.37.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6372"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8818" name="__module.model.layers.37.self_attn/aten::transpose/ScatterElementsUpdate_1" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8819" name="__module.model.layers.37.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6373,k.75"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8820" name="__module.model.layers.37.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6395"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8821" name="__module.model.layers.37.self_attn/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8822" name="__module.model.layers.37.self_attn/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="8823" name="__module.model.layers.37.self_attn/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="6396,6401" /> + </output> + </layer> + <layer id="8824" name="__module.model.layers.37.self_attn/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="8825" name="__module.model.layers.37.self_attn/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="6398,6399,6403,6404" /> + </output> + </layer> + <layer id="8826" name="Constant_221101" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8827" name="__module.model.layers.37.self_attn/aten::slice/Reshape_13" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8828" name="__module.model.layers.37.self_attn/aten::slice/Reshape_9" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8829" name="__module.model.layers.37.self_attn/aten::slice/Reshape_10" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8830" name="__module.model.layers.37.self_attn/aten::slice/Reshape_11" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8831" name="__module.model.layers.37.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="6405,x2.151"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="8832" name="Constant_290423" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8833" name="__module.model.layers.37.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6406"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="8834" name="__module.model.layers.37.self_attn/aten::slice/Reshape_12" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8835" name="__module.model.layers.37.self_attn/aten::slice/Reshape_14" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8836" name="__module.model.layers.37.self_attn/aten::slice/Reshape_15" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8837" name="__module.model.layers.37.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="6400"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="8838" name="__module.model.layers.37.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6408"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8839" name="__module.model.layers.37.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6409"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8840" name="__module.model.layers.37.self_attn/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6410"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8841" name="__module.model.layers.37.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.37.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8842" name="__module.model.layers.37.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="6422,6423,6424"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8843" name="__module.model.layers.37.self_attn/aten::size/ShapeOf_6" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8844" name="Constant_302549" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="938477672" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8845" name="Constant_302550" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="8846" name="Gather_302551" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8847" name="Constant_269166" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8848" name="Constant_277486" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8849" name="Constant_277487" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="8850" name="Gather_277488" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8851" name="__module.model.layers.37.self_attn/prim::ListConstruct/Concat_2" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="3" precision="I64" names="6425"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="8852" name="__module.model.layers.37.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6426,hidden_states.1121"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8853" name="Constant_301921" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8854" name="__module.model.layers.37.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6430,key_states.155"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8855" name="Constant_341750" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="8856" name="Constant_341743" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8857" name="Constant_341745" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8858" name="Constant_341747" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8859" name="Concat_341748" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8860" name="Broadcast_341751" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8861" name="ReadValue_333202" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.37.valuepresent.37.value" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.37.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8862" name="Constant_325534" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="8863" name="Gather_325535" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8864" name="self.model.layers.37.self_attn.v_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="6088525944" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8865" name="Convert_387737" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8866" name="self.model.layers.37.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="6091147384" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8867" name="Convert_387739" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8868" name="self.model.layers.37.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8869" name="self.model.layers.37.self_attn.v_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="6091167864" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8870" name="self.model.layers.37.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8871" name="Constant_387744" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8872" name="Reshape_387745" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8873" name="__module.model.layers.37.self_attn.v_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8874" name="__module.model.layers.37.self_attn.v_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="8875" name="self.model.layers.37.self_attn.v_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="6091249784" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.37.self_attn.v_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="8876" name="__module.model.layers.37.self_attn.v_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="8877" name="__module.model.layers.37.self_attn.v_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6367,value_states.75"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="8878" name="Constant_301922" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8879" name="__module.model.layers.37.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6375"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8880" name="__module.model.layers.37.self_attn/aten::transpose/ScatterElementsUpdate_2" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8881" name="__module.model.layers.37.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6376"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8882" name="__module.model.layers.37.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.37.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8883" name="__module.model.layers.37.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="6438,6439,6440"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8884" name="__module.model.layers.37.self_attn/aten::size/ShapeOf_10" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8885" name="Constant_302307" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8886" name="__module.model.layers.37.self_attn/aten::size/Constant_11" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="8887" name="__module.model.layers.37.self_attn/aten::size/Gather_11" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="6432"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8888" name="Constant_269184" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8889" name="Constant_277496" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8890" name="Constant_277497" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="8891" name="Gather_277498" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8892" name="__module.model.layers.37.self_attn/prim::ListConstruct/Concat_5" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="6441"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="8893" name="__module.model.layers.37.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6442,hidden_states.1125"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8894" name="Constant_301923" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8895" name="__module.model.layers.37.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6446"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8896" name="__module.model.layers.37.self_attn/aten::slice/Reshape_60" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8897" name="ShapeOf_300762" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8898" name="Constant_300763" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8899" name="Constant_300764" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="8900" name="Gather_300765" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8901" name="ShapeOf_300766" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8902" name="Constant_300767" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8903" name="Constant_300768" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="8904" name="Gather_300769" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8905" name="Add_300770" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="6447"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8906" name="__module.model.layers.37.self_attn/aten::slice/Reshape_62" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8907" name="__module.model.layers.37.self_attn/aten::slice/Reshape_63" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8908" name="__module.model.layers.37.self_attn/aten::slice/Slice_15" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="6451"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="8909" name="__module.model.layers.37.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="6452,attn_output.149"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8910" name="__module.model.layers.37.self_attn/aten::transpose/ScatterElementsUpdate_3" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="8911" name="__module.model.layers.37.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6453"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8912" name="Constant_301924" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="798146608" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="8913" name="__module.model.layers.37.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6456"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8914" name="self.model.layers.37.self_attn.o_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="6091251832" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8915" name="Convert_386777" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8916" name="self.model.layers.37.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="6104359032" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8917" name="Convert_386779" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8918" name="self.model.layers.37.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8919" name="self.model.layers.37.self_attn.o_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="6104461432" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8920" name="self.model.layers.37.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8921" name="Constant_386784" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8922" name="Reshape_386785" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8923" name="__module.model.layers.37.self_attn.o_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8924" name="__module.model.layers.37.self_attn.o_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6458,6460,hidden_states.1127"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8925" name="__module.model.layers.37/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6463,6465,6476,hidden_states.1129,hidden_states.1131"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8926" name="Constant_290427" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="6104871032" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8927" name="Constant_290426" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8928" name="Constant_290424" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8929" name="__module.model.layers.37.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6466"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8930" name="Constant_25988" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="6467"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8931" name="__module.model.layers.37.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6468,variance.151"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8932" name="Constant_290425" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8933" name="__module.model.layers.37.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6469"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8934" name="__module.model.layers.37.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8935" name="__module.model.layers.37.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6470"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8936" name="__module.model.layers.37.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6471,6472,hidden_states.1133,hidden_states.1135"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8937" name="__module.model.layers.37.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6473,6475"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8938" name="self.model.layers.37.mlp.gate_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="6104891512" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8939" name="Convert_385707" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8940" name="self.model.layers.37.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="6140280952" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8941" name="Convert_385709" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8942" name="self.model.layers.37.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8943" name="self.model.layers.37.mlp.gate_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="6140557432" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8944" name="self.model.layers.37.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8945" name="Constant_385714" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8946" name="Reshape_385715" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8947" name="__module.model.layers.37.mlp.gate_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8948" name="__module.model.layers.37.mlp.gate_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6481,input.75"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="8949" name="__module.model.layers.37.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="6482"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="8950" name="self.model.layers.37.mlp.up_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="6141663352" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8951" name="Convert_385697" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8952" name="self.model.layers.37.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="6177052792" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8953" name="Convert_385699" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8954" name="self.model.layers.37.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8955" name="self.model.layers.37.mlp.up_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="6177329272" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8956" name="self.model.layers.37.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8957" name="Constant_385704" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8958" name="Reshape_385705" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8959" name="__module.model.layers.37.mlp.up_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8960" name="__module.model.layers.37.mlp.up_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6484"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="8961" name="__module.model.layers.37.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6485"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="8962" name="self.model.layers.37.mlp.down_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 128" offset="6178435192" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8963" name="Convert_385717" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8964" name="self.model.layers.37.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 1" offset="6213824632" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8965" name="Convert_385719" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8966" name="self.model.layers.37.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8967" name="self.model.layers.37.mlp.down_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 108, 1" offset="6214101112" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8968" name="self.model.layers.37.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8969" name="Constant_385724" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="922101848" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8970" name="Reshape_385725" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="8971" name="__module.model.layers.37.mlp.down_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="8972" name="__module.model.layers.37.mlp.down_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6487,hidden_states.1137"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8973" name="__module.model.layers.37/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6488,6490,6498,6509,hidden_states.1139,hidden_states.1141"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8974" name="Constant_290431" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="6215207032" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8975" name="Constant_290430" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8976" name="Constant_290428" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8977" name="__module.model.layers.38.input_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6499"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8978" name="Constant_26062" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="6500"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8979" name="__module.model.layers.38.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6501,variance.153"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8980" name="Constant_290429" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8981" name="__module.model.layers.38.input_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6502"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8982" name="__module.model.layers.38.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8983" name="__module.model.layers.38.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6503"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8984" name="__module.model.layers.38.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6504,6505,hidden_states.1143,hidden_states.1145"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8985" name="__module.model.layers.38.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6506,6508,hidden_states.1147"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8986" name="self.model.layers.38.self_attn.q_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="6215227512" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8987" name="Convert_386787" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8988" name="self.model.layers.38.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="6228334712" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8989" name="Convert_386789" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8990" name="self.model.layers.38.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8991" name="self.model.layers.38.self_attn.q_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="6228437112" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="8992" name="self.model.layers.38.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="8993" name="Constant_386794" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="8994" name="Reshape_386795" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8995" name="__module.model.layers.38.self_attn.q_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8996" name="__module.model.layers.38.self_attn.q_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8997" name="self.model.layers.38.self_attn.q_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="5120" offset="6228846712" size="10240" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.38.self_attn.q_proj.bias"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8998" name="__module.model.layers.38.self_attn.q_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="8999" name="__module.model.layers.38.self_attn.q_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6518,query_states.77"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9000" name="Constant_301925" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="792694336" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9001" name="__module.model.layers.38.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6526"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9002" name="__module.model.layers.38.self_attn/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9003" name="__module.model.layers.38.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6527,q.77"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9004" name="__module.model.layers.38.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6536"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9005" name="__module.model.layers.38.self_attn/aten::size/ShapeOf_3" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9006" name="__module.model.layers.38.self_attn/aten::size/Constant_3" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="9007" name="__module.model.layers.38.self_attn/aten::size/Gather_3" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="6537,6542" /> + </output> + </layer> + <layer id="9008" name="__module.model.layers.38.self_attn/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="9009" name="__module.model.layers.38.self_attn/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="6539,6540,6544,6545" /> + </output> + </layer> + <layer id="9010" name="Constant_221115" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9011" name="__module.model.layers.38.self_attn/aten::slice/Reshape_5" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9012" name="__module.model.layers.38.self_attn/aten::slice/Reshape_1" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9013" name="__module.model.layers.38.self_attn/aten::slice/Reshape_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9014" name="__module.model.layers.38.self_attn/aten::slice/Reshape_3" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9015" name="__module.model.layers.38.self_attn/aten::slice/Slice" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="6546,x2.153"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="9016" name="Constant_290432" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9017" name="__module.model.layers.38.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6547"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="9018" name="__module.model.layers.38.self_attn/aten::slice/Reshape_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9019" name="__module.model.layers.38.self_attn/aten::slice/Reshape_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9020" name="__module.model.layers.38.self_attn/aten::slice/Reshape_7" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9021" name="__module.model.layers.38.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="6541"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="9022" name="__module.model.layers.38.self_attn/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6549"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9023" name="__module.model.layers.38.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6550"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9024" name="__module.model.layers.38.self_attn/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6551"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9025" name="Constant_341763" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="9026" name="Constant_341756" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9027" name="Constant_341758" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9028" name="Constant_341760" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9029" name="Concat_341761" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9030" name="Broadcast_341764" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9031" name="ReadValue_333204" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.38.keypresent.38.key" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.38.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9032" name="Constant_325537" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="9033" name="Gather_325538" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9034" name="self.model.layers.38.self_attn.k_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="6228856952" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9035" name="Convert_387747" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9036" name="self.model.layers.38.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="6231478392" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9037" name="Convert_387749" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9038" name="self.model.layers.38.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9039" name="self.model.layers.38.self_attn.k_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="6231498872" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9040" name="self.model.layers.38.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9041" name="Constant_387754" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9042" name="Reshape_387755" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9043" name="__module.model.layers.38.self_attn.k_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9044" name="__module.model.layers.38.self_attn.k_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="9045" name="self.model.layers.38.self_attn.k_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="6231580792" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.38.self_attn.k_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="9046" name="__module.model.layers.38.self_attn.k_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="9047" name="__module.model.layers.38.self_attn.k_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6521,key_states.157"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="9048" name="Constant_301926" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9049" name="__module.model.layers.38.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6529"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9050" name="__module.model.layers.38.self_attn/aten::transpose/ScatterElementsUpdate_1" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9051" name="__module.model.layers.38.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6530,k.77"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9052" name="__module.model.layers.38.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6552"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9053" name="__module.model.layers.38.self_attn/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9054" name="__module.model.layers.38.self_attn/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="9055" name="__module.model.layers.38.self_attn/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="6553,6558" /> + </output> + </layer> + <layer id="9056" name="__module.model.layers.38.self_attn/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="9057" name="__module.model.layers.38.self_attn/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="6555,6556,6560,6561" /> + </output> + </layer> + <layer id="9058" name="Constant_221116" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9059" name="__module.model.layers.38.self_attn/aten::slice/Reshape_13" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9060" name="__module.model.layers.38.self_attn/aten::slice/Reshape_9" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9061" name="__module.model.layers.38.self_attn/aten::slice/Reshape_10" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9062" name="__module.model.layers.38.self_attn/aten::slice/Reshape_11" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9063" name="__module.model.layers.38.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="6562,x2.155"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="9064" name="Constant_290433" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9065" name="__module.model.layers.38.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6563"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="9066" name="__module.model.layers.38.self_attn/aten::slice/Reshape_12" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9067" name="__module.model.layers.38.self_attn/aten::slice/Reshape_14" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9068" name="__module.model.layers.38.self_attn/aten::slice/Reshape_15" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9069" name="__module.model.layers.38.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="6557"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="9070" name="__module.model.layers.38.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6565"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9071" name="__module.model.layers.38.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6566"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9072" name="__module.model.layers.38.self_attn/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6567"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9073" name="__module.model.layers.38.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.38.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9074" name="__module.model.layers.38.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="6579,6580,6581"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9075" name="__module.model.layers.38.self_attn/aten::size/ShapeOf_6" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9076" name="Constant_302554" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="938477672" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9077" name="Constant_302555" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="9078" name="Gather_302556" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9079" name="Constant_269202" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9080" name="Constant_277521" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9081" name="Constant_277522" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="9082" name="Gather_277523" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9083" name="__module.model.layers.38.self_attn/prim::ListConstruct/Concat_2" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="3" precision="I64" names="6582"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="9084" name="__module.model.layers.38.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6583,hidden_states.1151"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9085" name="Constant_301927" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9086" name="__module.model.layers.38.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6587,key_states.159"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9087" name="Constant_341776" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="9088" name="Constant_341769" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9089" name="Constant_341771" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9090" name="Constant_341773" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9091" name="Concat_341774" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9092" name="Broadcast_341777" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9093" name="ReadValue_333206" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.38.valuepresent.38.value" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.38.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9094" name="Constant_325540" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="9095" name="Gather_325541" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9096" name="self.model.layers.38.self_attn.v_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="6231582840" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9097" name="Convert_387757" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9098" name="self.model.layers.38.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="6234204280" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9099" name="Convert_387759" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9100" name="self.model.layers.38.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9101" name="self.model.layers.38.self_attn.v_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="6234224760" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9102" name="self.model.layers.38.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9103" name="Constant_387764" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9104" name="Reshape_387765" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9105" name="__module.model.layers.38.self_attn.v_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9106" name="__module.model.layers.38.self_attn.v_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="9107" name="self.model.layers.38.self_attn.v_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="6234306680" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.38.self_attn.v_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="9108" name="__module.model.layers.38.self_attn.v_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="9109" name="__module.model.layers.38.self_attn.v_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6524,value_states.77"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="9110" name="Constant_301928" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9111" name="__module.model.layers.38.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6532"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9112" name="__module.model.layers.38.self_attn/aten::transpose/ScatterElementsUpdate_2" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9113" name="__module.model.layers.38.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6533"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9114" name="__module.model.layers.38.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.38.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9115" name="__module.model.layers.38.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="6595,6596,6597"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9116" name="__module.model.layers.38.self_attn/aten::size/ShapeOf_10" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9117" name="Constant_302313" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9118" name="__module.model.layers.38.self_attn/aten::size/Constant_11" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="9119" name="__module.model.layers.38.self_attn/aten::size/Gather_11" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="6589"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9120" name="Constant_269220" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9121" name="Constant_277531" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9122" name="Constant_277532" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="9123" name="Gather_277533" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9124" name="__module.model.layers.38.self_attn/prim::ListConstruct/Concat_5" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="6598"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="9125" name="__module.model.layers.38.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6599,hidden_states.1155"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9126" name="Constant_301929" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9127" name="__module.model.layers.38.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6603"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9128" name="__module.model.layers.38.self_attn/aten::slice/Reshape_60" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9129" name="ShapeOf_300848" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9130" name="Constant_300849" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9131" name="Constant_300850" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="9132" name="Gather_300851" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9133" name="ShapeOf_300852" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9134" name="Constant_300853" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9135" name="Constant_300854" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="9136" name="Gather_300855" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9137" name="Add_300856" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="6604"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9138" name="__module.model.layers.38.self_attn/aten::slice/Reshape_62" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9139" name="__module.model.layers.38.self_attn/aten::slice/Reshape_63" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9140" name="__module.model.layers.38.self_attn/aten::slice/Slice_15" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="6608"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="9141" name="__module.model.layers.38.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="6609,attn_output.153"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9142" name="__module.model.layers.38.self_attn/aten::transpose/ScatterElementsUpdate_3" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9143" name="__module.model.layers.38.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6610"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9144" name="Constant_301930" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="798146608" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="9145" name="__module.model.layers.38.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6613"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9146" name="self.model.layers.38.self_attn.o_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="6234308728" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9147" name="Convert_386797" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9148" name="self.model.layers.38.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="6247415928" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9149" name="Convert_386799" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9150" name="self.model.layers.38.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9151" name="self.model.layers.38.self_attn.o_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="6247518328" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9152" name="self.model.layers.38.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9153" name="Constant_386804" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9154" name="Reshape_386805" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9155" name="__module.model.layers.38.self_attn.o_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9156" name="__module.model.layers.38.self_attn.o_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6615,6617,hidden_states.1157"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9157" name="__module.model.layers.38/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6620,6622,6633,hidden_states.1159,hidden_states.1161"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9158" name="Constant_290437" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="6247927928" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9159" name="Constant_290436" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9160" name="Constant_290434" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9161" name="__module.model.layers.38.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6623"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9162" name="Constant_26660" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="6624"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9163" name="__module.model.layers.38.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6625,variance.155"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9164" name="Constant_290435" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9165" name="__module.model.layers.38.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6626"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9166" name="__module.model.layers.38.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9167" name="__module.model.layers.38.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6627"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9168" name="__module.model.layers.38.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6628,6629,hidden_states.1163,hidden_states.1165"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9169" name="__module.model.layers.38.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6630,6632"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9170" name="self.model.layers.38.mlp.gate_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="6247948408" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9171" name="Convert_385737" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9172" name="self.model.layers.38.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="6283337848" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9173" name="Convert_385739" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9174" name="self.model.layers.38.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9175" name="self.model.layers.38.mlp.gate_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="6283614328" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9176" name="self.model.layers.38.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9177" name="Constant_385744" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9178" name="Reshape_385745" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9179" name="__module.model.layers.38.mlp.gate_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9180" name="__module.model.layers.38.mlp.gate_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6638,input.77"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="9181" name="__module.model.layers.38.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="6639"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="9182" name="self.model.layers.38.mlp.up_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="6284720248" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9183" name="Convert_385727" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9184" name="self.model.layers.38.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="6320109688" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9185" name="Convert_385729" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9186" name="self.model.layers.38.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9187" name="self.model.layers.38.mlp.up_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="6320386168" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9188" name="self.model.layers.38.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9189" name="Constant_385734" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9190" name="Reshape_385735" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9191" name="__module.model.layers.38.mlp.up_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9192" name="__module.model.layers.38.mlp.up_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6641"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="9193" name="__module.model.layers.38.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6642"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="9194" name="self.model.layers.38.mlp.down_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 128" offset="6321492088" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9195" name="Convert_385747" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9196" name="self.model.layers.38.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 1" offset="6356881528" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9197" name="Convert_385749" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9198" name="self.model.layers.38.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9199" name="self.model.layers.38.mlp.down_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 108, 1" offset="6357158008" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9200" name="self.model.layers.38.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9201" name="Constant_385754" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="922101848" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9202" name="Reshape_385755" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="9203" name="__module.model.layers.38.mlp.down_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="9204" name="__module.model.layers.38.mlp.down_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6644,hidden_states.1167"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9205" name="__module.model.layers.38/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6645,6647,6655,6666,hidden_states.1169,hidden_states.1171"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9206" name="Constant_290441" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="6358263928" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9207" name="Constant_290440" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9208" name="Constant_290438" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9209" name="__module.model.layers.39.input_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6656"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9210" name="Constant_26734" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="6657"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9211" name="__module.model.layers.39.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6658,variance.157"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9212" name="Constant_290439" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9213" name="__module.model.layers.39.input_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6659"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9214" name="__module.model.layers.39.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9215" name="__module.model.layers.39.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6660"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9216" name="__module.model.layers.39.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6661,6662,hidden_states.1173,hidden_states.1175"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9217" name="__module.model.layers.39.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6663,6665,hidden_states.1177"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9218" name="self.model.layers.39.self_attn.q_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="6358284408" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9219" name="Convert_386807" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9220" name="self.model.layers.39.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="6371391608" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9221" name="Convert_386809" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9222" name="self.model.layers.39.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9223" name="self.model.layers.39.self_attn.q_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="6371494008" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9224" name="self.model.layers.39.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9225" name="Constant_386814" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9226" name="Reshape_386815" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9227" name="__module.model.layers.39.self_attn.q_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9228" name="__module.model.layers.39.self_attn.q_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9229" name="self.model.layers.39.self_attn.q_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="5120" offset="6371903608" size="10240" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.39.self_attn.q_proj.bias"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9230" name="__module.model.layers.39.self_attn.q_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9231" name="__module.model.layers.39.self_attn.q_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6675,query_states.79"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9232" name="Constant_301931" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="792694336" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9233" name="__module.model.layers.39.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6683"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9234" name="__module.model.layers.39.self_attn/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9235" name="__module.model.layers.39.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6684,q.79"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9236" name="__module.model.layers.39.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6693"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9237" name="__module.model.layers.39.self_attn/aten::size/ShapeOf_3" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9238" name="__module.model.layers.39.self_attn/aten::size/Constant_3" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="9239" name="__module.model.layers.39.self_attn/aten::size/Gather_3" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="6694,6699" /> + </output> + </layer> + <layer id="9240" name="__module.model.layers.39.self_attn/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="9241" name="__module.model.layers.39.self_attn/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="6696,6697,6701,6702" /> + </output> + </layer> + <layer id="9242" name="Constant_221130" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9243" name="__module.model.layers.39.self_attn/aten::slice/Reshape_5" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9244" name="__module.model.layers.39.self_attn/aten::slice/Reshape_1" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9245" name="__module.model.layers.39.self_attn/aten::slice/Reshape_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9246" name="__module.model.layers.39.self_attn/aten::slice/Reshape_3" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9247" name="__module.model.layers.39.self_attn/aten::slice/Slice" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="6703,x2.157"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="9248" name="Constant_290442" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9249" name="__module.model.layers.39.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6704"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="9250" name="__module.model.layers.39.self_attn/aten::slice/Reshape_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9251" name="__module.model.layers.39.self_attn/aten::slice/Reshape_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9252" name="__module.model.layers.39.self_attn/aten::slice/Reshape_7" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9253" name="__module.model.layers.39.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="6698"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="9254" name="__module.model.layers.39.self_attn/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6706"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9255" name="__module.model.layers.39.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6707"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9256" name="__module.model.layers.39.self_attn/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6708"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9257" name="Constant_341789" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="9258" name="Constant_341782" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9259" name="Constant_341784" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9260" name="Constant_341786" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9261" name="Concat_341787" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9262" name="Broadcast_341790" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9263" name="ReadValue_333208" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.39.keypresent.39.key" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.39.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9264" name="Constant_325543" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="9265" name="Gather_325544" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9266" name="self.model.layers.39.self_attn.k_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="6371913848" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9267" name="Convert_387767" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9268" name="self.model.layers.39.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="6374535288" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9269" name="Convert_387769" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9270" name="self.model.layers.39.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9271" name="self.model.layers.39.self_attn.k_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="6374555768" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9272" name="self.model.layers.39.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9273" name="Constant_387774" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9274" name="Reshape_387775" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9275" name="__module.model.layers.39.self_attn.k_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9276" name="__module.model.layers.39.self_attn.k_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="9277" name="self.model.layers.39.self_attn.k_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="6374637688" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.39.self_attn.k_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="9278" name="__module.model.layers.39.self_attn.k_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="9279" name="__module.model.layers.39.self_attn.k_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6678,key_states.161"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="9280" name="Constant_301932" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9281" name="__module.model.layers.39.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6686"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9282" name="__module.model.layers.39.self_attn/aten::transpose/ScatterElementsUpdate_1" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9283" name="__module.model.layers.39.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6687,k.79"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9284" name="__module.model.layers.39.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6709"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9285" name="__module.model.layers.39.self_attn/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9286" name="__module.model.layers.39.self_attn/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="9287" name="__module.model.layers.39.self_attn/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="6710,6715" /> + </output> + </layer> + <layer id="9288" name="__module.model.layers.39.self_attn/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="9289" name="__module.model.layers.39.self_attn/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="6712,6713,6717,6718" /> + </output> + </layer> + <layer id="9290" name="Constant_221131" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9291" name="__module.model.layers.39.self_attn/aten::slice/Reshape_13" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9292" name="__module.model.layers.39.self_attn/aten::slice/Reshape_9" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9293" name="__module.model.layers.39.self_attn/aten::slice/Reshape_10" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9294" name="__module.model.layers.39.self_attn/aten::slice/Reshape_11" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9295" name="__module.model.layers.39.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="6719,x2.159"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="9296" name="Constant_290443" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9297" name="__module.model.layers.39.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6720"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="9298" name="__module.model.layers.39.self_attn/aten::slice/Reshape_12" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9299" name="__module.model.layers.39.self_attn/aten::slice/Reshape_14" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9300" name="__module.model.layers.39.self_attn/aten::slice/Reshape_15" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9301" name="__module.model.layers.39.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="6714"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="9302" name="__module.model.layers.39.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6722"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9303" name="__module.model.layers.39.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6723"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9304" name="__module.model.layers.39.self_attn/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6724"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9305" name="__module.model.layers.39.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.39.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9306" name="__module.model.layers.39.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="6736,6737,6738"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9307" name="__module.model.layers.39.self_attn/aten::size/ShapeOf_6" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9308" name="Constant_302559" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="938477672" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9309" name="Constant_302560" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="9310" name="Gather_302561" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9311" name="Constant_269238" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9312" name="Constant_277556" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9313" name="Constant_277557" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="9314" name="Gather_277558" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9315" name="__module.model.layers.39.self_attn/prim::ListConstruct/Concat_2" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="3" precision="I64" names="6739"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="9316" name="__module.model.layers.39.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6740,hidden_states.1181"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9317" name="Constant_301933" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9318" name="__module.model.layers.39.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6744,key_states.163"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9319" name="Constant_341802" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="9320" name="Constant_341795" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9321" name="Constant_341797" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9322" name="Constant_341799" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9323" name="Concat_341800" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9324" name="Broadcast_341803" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9325" name="ReadValue_333210" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.39.valuepresent.39.value" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.39.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9326" name="Constant_325546" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="9327" name="Gather_325547" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9328" name="self.model.layers.39.self_attn.v_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="6374639736" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9329" name="Convert_387777" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9330" name="self.model.layers.39.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="6377261176" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9331" name="Convert_387779" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9332" name="self.model.layers.39.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9333" name="self.model.layers.39.self_attn.v_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="6377281656" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9334" name="self.model.layers.39.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9335" name="Constant_387784" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9336" name="Reshape_387785" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9337" name="__module.model.layers.39.self_attn.v_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9338" name="__module.model.layers.39.self_attn.v_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="9339" name="self.model.layers.39.self_attn.v_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="6377363576" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.39.self_attn.v_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="9340" name="__module.model.layers.39.self_attn.v_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="9341" name="__module.model.layers.39.self_attn.v_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6681,value_states.79"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="9342" name="Constant_301934" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9343" name="__module.model.layers.39.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6689"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9344" name="__module.model.layers.39.self_attn/aten::transpose/ScatterElementsUpdate_2" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9345" name="__module.model.layers.39.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6690"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9346" name="__module.model.layers.39.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.39.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9347" name="__module.model.layers.39.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="6752,6753,6754"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9348" name="__module.model.layers.39.self_attn/aten::size/ShapeOf_10" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9349" name="Constant_302319" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9350" name="__module.model.layers.39.self_attn/aten::size/Constant_11" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="9351" name="__module.model.layers.39.self_attn/aten::size/Gather_11" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="6746"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9352" name="Constant_269256" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9353" name="Constant_277566" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9354" name="Constant_277567" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="9355" name="Gather_277568" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9356" name="__module.model.layers.39.self_attn/prim::ListConstruct/Concat_5" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="6755"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="9357" name="__module.model.layers.39.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6756,hidden_states.1185"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9358" name="Constant_301935" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9359" name="__module.model.layers.39.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6760"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9360" name="__module.model.layers.39.self_attn/aten::slice/Reshape_60" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9361" name="ShapeOf_300934" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9362" name="Constant_300935" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9363" name="Constant_300936" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="9364" name="Gather_300937" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9365" name="ShapeOf_300938" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9366" name="Constant_300939" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9367" name="Constant_300940" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="9368" name="Gather_300941" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9369" name="Add_300942" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="6761"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9370" name="__module.model.layers.39.self_attn/aten::slice/Reshape_62" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9371" name="__module.model.layers.39.self_attn/aten::slice/Reshape_63" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9372" name="__module.model.layers.39.self_attn/aten::slice/Slice_15" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="6765"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="9373" name="__module.model.layers.39.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="6766,attn_output.157"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9374" name="__module.model.layers.39.self_attn/aten::transpose/ScatterElementsUpdate_3" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9375" name="__module.model.layers.39.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6767"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9376" name="Constant_301936" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="798146608" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="9377" name="__module.model.layers.39.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6770"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9378" name="self.model.layers.39.self_attn.o_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="6377365624" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9379" name="Convert_386817" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9380" name="self.model.layers.39.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="6390472824" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9381" name="Convert_386819" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9382" name="self.model.layers.39.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9383" name="self.model.layers.39.self_attn.o_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="6390575224" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9384" name="self.model.layers.39.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9385" name="Constant_386824" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9386" name="Reshape_386825" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9387" name="__module.model.layers.39.self_attn.o_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9388" name="__module.model.layers.39.self_attn.o_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6772,6774,hidden_states.1187"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9389" name="__module.model.layers.39/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6777,6779,6790,hidden_states.1189,hidden_states.1191"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9390" name="Constant_290447" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="6390984824" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9391" name="Constant_290446" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9392" name="Constant_290444" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9393" name="__module.model.layers.39.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6780"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9394" name="Constant_27332" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="6781"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9395" name="__module.model.layers.39.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6782,variance.159"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9396" name="Constant_290445" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9397" name="__module.model.layers.39.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6783"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9398" name="__module.model.layers.39.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9399" name="__module.model.layers.39.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6784"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9400" name="__module.model.layers.39.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6785,6786,hidden_states.1193,hidden_states.1195"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9401" name="__module.model.layers.39.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6787,6789"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9402" name="self.model.layers.39.mlp.gate_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="6391005304" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9403" name="Convert_385767" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9404" name="self.model.layers.39.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="6426394744" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9405" name="Convert_385769" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9406" name="self.model.layers.39.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9407" name="self.model.layers.39.mlp.gate_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="6426671224" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9408" name="self.model.layers.39.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9409" name="Constant_385774" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9410" name="Reshape_385775" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9411" name="__module.model.layers.39.mlp.gate_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9412" name="__module.model.layers.39.mlp.gate_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6795,input.79"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="9413" name="__module.model.layers.39.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="6796"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="9414" name="self.model.layers.39.mlp.up_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="6427777144" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9415" name="Convert_385757" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9416" name="self.model.layers.39.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="6463166584" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9417" name="Convert_385759" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9418" name="self.model.layers.39.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9419" name="self.model.layers.39.mlp.up_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="6463443064" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9420" name="self.model.layers.39.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9421" name="Constant_385764" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9422" name="Reshape_385765" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9423" name="__module.model.layers.39.mlp.up_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9424" name="__module.model.layers.39.mlp.up_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6798"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="9425" name="__module.model.layers.39.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6799"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="9426" name="self.model.layers.39.mlp.down_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 128" offset="6464548984" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9427" name="Convert_385777" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9428" name="self.model.layers.39.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 1" offset="6499938424" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9429" name="Convert_385779" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9430" name="self.model.layers.39.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9431" name="self.model.layers.39.mlp.down_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 108, 1" offset="6500214904" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9432" name="self.model.layers.39.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9433" name="Constant_385784" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="922101848" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9434" name="Reshape_385785" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="9435" name="__module.model.layers.39.mlp.down_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="9436" name="__module.model.layers.39.mlp.down_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6801,hidden_states.1197"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9437" name="__module.model.layers.39/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6802,6804,6812,6823,hidden_states.1199,hidden_states.1201"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9438" name="Constant_290451" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="6501320824" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9439" name="Constant_290450" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9440" name="Constant_290448" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9441" name="__module.model.layers.40.input_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6813"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9442" name="Constant_27406" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="6814"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9443" name="__module.model.layers.40.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6815,variance.161"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9444" name="Constant_290449" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9445" name="__module.model.layers.40.input_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6816"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9446" name="__module.model.layers.40.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9447" name="__module.model.layers.40.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6817"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9448" name="__module.model.layers.40.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6818,6819,hidden_states.1203,hidden_states.1205"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9449" name="__module.model.layers.40.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6820,6822,hidden_states.1207"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9450" name="self.model.layers.40.self_attn.q_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="6501341304" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9451" name="Convert_386827" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9452" name="self.model.layers.40.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="6514448504" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9453" name="Convert_386829" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9454" name="self.model.layers.40.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9455" name="self.model.layers.40.self_attn.q_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="6514550904" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9456" name="self.model.layers.40.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9457" name="Constant_386834" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9458" name="Reshape_386835" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9459" name="__module.model.layers.40.self_attn.q_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9460" name="__module.model.layers.40.self_attn.q_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9461" name="self.model.layers.40.self_attn.q_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="5120" offset="6514960504" size="10240" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.40.self_attn.q_proj.bias"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9462" name="__module.model.layers.40.self_attn.q_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9463" name="__module.model.layers.40.self_attn.q_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6832,query_states.81"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9464" name="Constant_301937" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="792694336" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9465" name="__module.model.layers.40.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6840"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9466" name="__module.model.layers.40.self_attn/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9467" name="__module.model.layers.40.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6841,q.81"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9468" name="__module.model.layers.40.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6850"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9469" name="__module.model.layers.40.self_attn/aten::size/ShapeOf_3" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9470" name="__module.model.layers.40.self_attn/aten::size/Constant_3" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="9471" name="__module.model.layers.40.self_attn/aten::size/Gather_3" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="6851,6856" /> + </output> + </layer> + <layer id="9472" name="__module.model.layers.40.self_attn/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="9473" name="__module.model.layers.40.self_attn/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="6853,6854,6858,6859" /> + </output> + </layer> + <layer id="9474" name="Constant_221145" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9475" name="__module.model.layers.40.self_attn/aten::slice/Reshape_5" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9476" name="__module.model.layers.40.self_attn/aten::slice/Reshape_1" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9477" name="__module.model.layers.40.self_attn/aten::slice/Reshape_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9478" name="__module.model.layers.40.self_attn/aten::slice/Reshape_3" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9479" name="__module.model.layers.40.self_attn/aten::slice/Slice" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="6860,x2.161"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="9480" name="Constant_290452" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9481" name="__module.model.layers.40.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6861"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="9482" name="__module.model.layers.40.self_attn/aten::slice/Reshape_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9483" name="__module.model.layers.40.self_attn/aten::slice/Reshape_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9484" name="__module.model.layers.40.self_attn/aten::slice/Reshape_7" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9485" name="__module.model.layers.40.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="6855"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="9486" name="__module.model.layers.40.self_attn/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6863"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9487" name="__module.model.layers.40.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6864"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9488" name="__module.model.layers.40.self_attn/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6865"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9489" name="Constant_341815" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="9490" name="Constant_341808" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9491" name="Constant_341810" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9492" name="Constant_341812" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9493" name="Concat_341813" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9494" name="Broadcast_341816" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9495" name="ReadValue_333216" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.40.keypresent.40.key" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.40.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9496" name="Constant_325549" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="9497" name="Gather_325550" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9498" name="self.model.layers.40.self_attn.k_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="6514970744" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9499" name="Convert_387787" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9500" name="self.model.layers.40.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="6517592184" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9501" name="Convert_387789" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9502" name="self.model.layers.40.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9503" name="self.model.layers.40.self_attn.k_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="6517612664" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9504" name="self.model.layers.40.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9505" name="Constant_387794" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9506" name="Reshape_387795" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9507" name="__module.model.layers.40.self_attn.k_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9508" name="__module.model.layers.40.self_attn.k_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="9509" name="self.model.layers.40.self_attn.k_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="6517694584" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.40.self_attn.k_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="9510" name="__module.model.layers.40.self_attn.k_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="9511" name="__module.model.layers.40.self_attn.k_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6835,key_states.165"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="9512" name="Constant_301938" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9513" name="__module.model.layers.40.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6843"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9514" name="__module.model.layers.40.self_attn/aten::transpose/ScatterElementsUpdate_1" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9515" name="__module.model.layers.40.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6844,k.81"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9516" name="__module.model.layers.40.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6866"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9517" name="__module.model.layers.40.self_attn/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9518" name="__module.model.layers.40.self_attn/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="9519" name="__module.model.layers.40.self_attn/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="6867,6872" /> + </output> + </layer> + <layer id="9520" name="__module.model.layers.40.self_attn/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="9521" name="__module.model.layers.40.self_attn/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="6869,6870,6874,6875" /> + </output> + </layer> + <layer id="9522" name="Constant_221146" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9523" name="__module.model.layers.40.self_attn/aten::slice/Reshape_13" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9524" name="__module.model.layers.40.self_attn/aten::slice/Reshape_9" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9525" name="__module.model.layers.40.self_attn/aten::slice/Reshape_10" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9526" name="__module.model.layers.40.self_attn/aten::slice/Reshape_11" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9527" name="__module.model.layers.40.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="6876,x2.163"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="9528" name="Constant_290453" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9529" name="__module.model.layers.40.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6877"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="9530" name="__module.model.layers.40.self_attn/aten::slice/Reshape_12" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9531" name="__module.model.layers.40.self_attn/aten::slice/Reshape_14" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9532" name="__module.model.layers.40.self_attn/aten::slice/Reshape_15" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9533" name="__module.model.layers.40.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="6871"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="9534" name="__module.model.layers.40.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6879"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9535" name="__module.model.layers.40.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6880"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9536" name="__module.model.layers.40.self_attn/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6881"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9537" name="__module.model.layers.40.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.40.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9538" name="__module.model.layers.40.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="6893,6894,6895"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9539" name="__module.model.layers.40.self_attn/aten::size/ShapeOf_6" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9540" name="Constant_302564" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="938477672" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9541" name="Constant_302565" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="9542" name="Gather_302566" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9543" name="Constant_269274" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9544" name="Constant_277591" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9545" name="Constant_277592" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="9546" name="Gather_277593" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9547" name="__module.model.layers.40.self_attn/prim::ListConstruct/Concat_2" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="3" precision="I64" names="6896"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="9548" name="__module.model.layers.40.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6897,hidden_states.1211"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9549" name="Constant_301939" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9550" name="__module.model.layers.40.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6901,key_states.167"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9551" name="Constant_341828" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="9552" name="Constant_341821" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9553" name="Constant_341823" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9554" name="Constant_341825" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9555" name="Concat_341826" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9556" name="Broadcast_341829" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9557" name="ReadValue_333218" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.40.valuepresent.40.value" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.40.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9558" name="Constant_325552" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="9559" name="Gather_325553" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9560" name="self.model.layers.40.self_attn.v_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="6517696632" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9561" name="Convert_387797" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9562" name="self.model.layers.40.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="6520318072" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9563" name="Convert_387799" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9564" name="self.model.layers.40.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9565" name="self.model.layers.40.self_attn.v_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="6520338552" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9566" name="self.model.layers.40.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9567" name="Constant_387804" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9568" name="Reshape_387805" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9569" name="__module.model.layers.40.self_attn.v_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9570" name="__module.model.layers.40.self_attn.v_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="9571" name="self.model.layers.40.self_attn.v_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="6520420472" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.40.self_attn.v_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="9572" name="__module.model.layers.40.self_attn.v_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="9573" name="__module.model.layers.40.self_attn.v_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6838,value_states.81"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="9574" name="Constant_301940" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9575" name="__module.model.layers.40.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6846"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9576" name="__module.model.layers.40.self_attn/aten::transpose/ScatterElementsUpdate_2" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9577" name="__module.model.layers.40.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6847"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9578" name="__module.model.layers.40.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.40.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9579" name="__module.model.layers.40.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="6909,6910,6911"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9580" name="__module.model.layers.40.self_attn/aten::size/ShapeOf_10" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9581" name="Constant_302325" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9582" name="__module.model.layers.40.self_attn/aten::size/Constant_11" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="9583" name="__module.model.layers.40.self_attn/aten::size/Gather_11" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="6903"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9584" name="Constant_269292" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9585" name="Constant_277601" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9586" name="Constant_277602" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="9587" name="Gather_277603" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9588" name="__module.model.layers.40.self_attn/prim::ListConstruct/Concat_5" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="6912"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="9589" name="__module.model.layers.40.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6913,hidden_states.1215"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9590" name="Constant_301941" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9591" name="__module.model.layers.40.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6917"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9592" name="__module.model.layers.40.self_attn/aten::slice/Reshape_60" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9593" name="ShapeOf_301020" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9594" name="Constant_301021" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9595" name="Constant_301022" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="9596" name="Gather_301023" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9597" name="ShapeOf_301024" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9598" name="Constant_301025" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9599" name="Constant_301026" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="9600" name="Gather_301027" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9601" name="Add_301028" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="6918"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9602" name="__module.model.layers.40.self_attn/aten::slice/Reshape_62" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9603" name="__module.model.layers.40.self_attn/aten::slice/Reshape_63" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9604" name="__module.model.layers.40.self_attn/aten::slice/Slice_15" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="6922"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="9605" name="__module.model.layers.40.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="6923,attn_output.161"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9606" name="__module.model.layers.40.self_attn/aten::transpose/ScatterElementsUpdate_3" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9607" name="__module.model.layers.40.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6924"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9608" name="Constant_301942" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="798146608" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="9609" name="__module.model.layers.40.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6927"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9610" name="self.model.layers.40.self_attn.o_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="6520422520" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9611" name="Convert_386837" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9612" name="self.model.layers.40.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="6533529720" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9613" name="Convert_386839" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9614" name="self.model.layers.40.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9615" name="self.model.layers.40.self_attn.o_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="6533632120" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9616" name="self.model.layers.40.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9617" name="Constant_386844" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9618" name="Reshape_386845" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9619" name="__module.model.layers.40.self_attn.o_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9620" name="__module.model.layers.40.self_attn.o_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6929,6931,hidden_states.1217"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9621" name="__module.model.layers.40/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6934,6936,6947,hidden_states.1219,hidden_states.1221"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9622" name="Constant_290457" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="6534041720" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9623" name="Constant_290456" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9624" name="Constant_290454" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9625" name="__module.model.layers.40.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6937"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9626" name="Constant_28004" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="6938"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9627" name="__module.model.layers.40.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6939,variance.163"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9628" name="Constant_290455" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9629" name="__module.model.layers.40.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6940"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9630" name="__module.model.layers.40.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9631" name="__module.model.layers.40.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6941"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9632" name="__module.model.layers.40.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6942,6943,hidden_states.1223,hidden_states.1225"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9633" name="__module.model.layers.40.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6944,6946"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9634" name="self.model.layers.40.mlp.gate_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="6534062200" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9635" name="Convert_385797" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9636" name="self.model.layers.40.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="6569451640" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9637" name="Convert_385799" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9638" name="self.model.layers.40.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9639" name="self.model.layers.40.mlp.gate_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="6569728120" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9640" name="self.model.layers.40.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9641" name="Constant_385804" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9642" name="Reshape_385805" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9643" name="__module.model.layers.40.mlp.gate_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9644" name="__module.model.layers.40.mlp.gate_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6952,input.81"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="9645" name="__module.model.layers.40.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="6953"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="9646" name="self.model.layers.40.mlp.up_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="6570834040" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9647" name="Convert_385787" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9648" name="self.model.layers.40.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="6606223480" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9649" name="Convert_385789" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9650" name="self.model.layers.40.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9651" name="self.model.layers.40.mlp.up_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="6606499960" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9652" name="self.model.layers.40.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9653" name="Constant_385794" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9654" name="Reshape_385795" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9655" name="__module.model.layers.40.mlp.up_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9656" name="__module.model.layers.40.mlp.up_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6955"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="9657" name="__module.model.layers.40.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6956"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="9658" name="self.model.layers.40.mlp.down_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 128" offset="6607605880" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9659" name="Convert_385807" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9660" name="self.model.layers.40.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 1" offset="6642995320" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9661" name="Convert_385809" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9662" name="self.model.layers.40.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9663" name="self.model.layers.40.mlp.down_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 108, 1" offset="6643271800" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9664" name="self.model.layers.40.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9665" name="Constant_385814" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="922101848" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9666" name="Reshape_385815" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="9667" name="__module.model.layers.40.mlp.down_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="9668" name="__module.model.layers.40.mlp.down_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6958,hidden_states.1227"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9669" name="__module.model.layers.40/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6959,6961,6969,6980,hidden_states.1229,hidden_states.1231"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9670" name="Constant_290461" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="6644377720" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9671" name="Constant_290460" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9672" name="Constant_290458" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9673" name="__module.model.layers.41.input_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6970"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9674" name="Constant_28078" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="6971"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9675" name="__module.model.layers.41.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6972,variance.165"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9676" name="Constant_290459" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9677" name="__module.model.layers.41.input_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6973"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9678" name="__module.model.layers.41.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9679" name="__module.model.layers.41.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6974"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9680" name="__module.model.layers.41.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6975,6976,hidden_states.1233,hidden_states.1235"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9681" name="__module.model.layers.41.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6977,6979,hidden_states.1237"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9682" name="self.model.layers.41.self_attn.q_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="6644398200" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9683" name="Convert_386847" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9684" name="self.model.layers.41.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="6657505400" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9685" name="Convert_386849" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9686" name="self.model.layers.41.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9687" name="self.model.layers.41.self_attn.q_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="6657607800" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9688" name="self.model.layers.41.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9689" name="Constant_386854" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9690" name="Reshape_386855" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9691" name="__module.model.layers.41.self_attn.q_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9692" name="__module.model.layers.41.self_attn.q_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9693" name="self.model.layers.41.self_attn.q_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="5120" offset="6658017400" size="10240" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.41.self_attn.q_proj.bias"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9694" name="__module.model.layers.41.self_attn.q_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9695" name="__module.model.layers.41.self_attn.q_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6989,query_states.83"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9696" name="Constant_301943" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="792694336" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9697" name="__module.model.layers.41.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6997"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9698" name="__module.model.layers.41.self_attn/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9699" name="__module.model.layers.41.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6998,q.83"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9700" name="__module.model.layers.41.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7007"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9701" name="__module.model.layers.41.self_attn/aten::size/ShapeOf_3" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9702" name="__module.model.layers.41.self_attn/aten::size/Constant_3" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="9703" name="__module.model.layers.41.self_attn/aten::size/Gather_3" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="7008,7013" /> + </output> + </layer> + <layer id="9704" name="__module.model.layers.41.self_attn/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="9705" name="__module.model.layers.41.self_attn/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="7010,7011,7015,7016" /> + </output> + </layer> + <layer id="9706" name="Constant_221160" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9707" name="__module.model.layers.41.self_attn/aten::slice/Reshape_5" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9708" name="__module.model.layers.41.self_attn/aten::slice/Reshape_1" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9709" name="__module.model.layers.41.self_attn/aten::slice/Reshape_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9710" name="__module.model.layers.41.self_attn/aten::slice/Reshape_3" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9711" name="__module.model.layers.41.self_attn/aten::slice/Slice" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="7017,x2.165"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="9712" name="Constant_290462" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9713" name="__module.model.layers.41.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7018"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="9714" name="__module.model.layers.41.self_attn/aten::slice/Reshape_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9715" name="__module.model.layers.41.self_attn/aten::slice/Reshape_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9716" name="__module.model.layers.41.self_attn/aten::slice/Reshape_7" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9717" name="__module.model.layers.41.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="7012"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="9718" name="__module.model.layers.41.self_attn/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7020"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9719" name="__module.model.layers.41.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7021"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9720" name="__module.model.layers.41.self_attn/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7022"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9721" name="Constant_341841" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="9722" name="Constant_341834" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9723" name="Constant_341836" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9724" name="Constant_341838" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9725" name="Concat_341839" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9726" name="Broadcast_341842" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9727" name="ReadValue_333220" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.41.keypresent.41.key" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.41.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9728" name="Constant_325555" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="9729" name="Gather_325556" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9730" name="self.model.layers.41.self_attn.k_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="6658027640" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9731" name="Convert_387807" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9732" name="self.model.layers.41.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="6660649080" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9733" name="Convert_387809" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9734" name="self.model.layers.41.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9735" name="self.model.layers.41.self_attn.k_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="6660669560" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9736" name="self.model.layers.41.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9737" name="Constant_387814" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9738" name="Reshape_387815" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9739" name="__module.model.layers.41.self_attn.k_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9740" name="__module.model.layers.41.self_attn.k_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="9741" name="self.model.layers.41.self_attn.k_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="6660751480" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.41.self_attn.k_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="9742" name="__module.model.layers.41.self_attn.k_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="9743" name="__module.model.layers.41.self_attn.k_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6992,key_states.169"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="9744" name="Constant_301944" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9745" name="__module.model.layers.41.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7000"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9746" name="__module.model.layers.41.self_attn/aten::transpose/ScatterElementsUpdate_1" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9747" name="__module.model.layers.41.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7001,k.83"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9748" name="__module.model.layers.41.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7023"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9749" name="__module.model.layers.41.self_attn/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9750" name="__module.model.layers.41.self_attn/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="9751" name="__module.model.layers.41.self_attn/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="7024,7029" /> + </output> + </layer> + <layer id="9752" name="__module.model.layers.41.self_attn/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="9753" name="__module.model.layers.41.self_attn/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="7026,7027,7031,7032" /> + </output> + </layer> + <layer id="9754" name="Constant_221161" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9755" name="__module.model.layers.41.self_attn/aten::slice/Reshape_13" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9756" name="__module.model.layers.41.self_attn/aten::slice/Reshape_9" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9757" name="__module.model.layers.41.self_attn/aten::slice/Reshape_10" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9758" name="__module.model.layers.41.self_attn/aten::slice/Reshape_11" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9759" name="__module.model.layers.41.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="7033,x2.167"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="9760" name="Constant_290463" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9761" name="__module.model.layers.41.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7034"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="9762" name="__module.model.layers.41.self_attn/aten::slice/Reshape_12" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9763" name="__module.model.layers.41.self_attn/aten::slice/Reshape_14" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9764" name="__module.model.layers.41.self_attn/aten::slice/Reshape_15" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9765" name="__module.model.layers.41.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="7028"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="9766" name="__module.model.layers.41.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7036"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9767" name="__module.model.layers.41.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7037"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9768" name="__module.model.layers.41.self_attn/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7038"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9769" name="__module.model.layers.41.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.41.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9770" name="__module.model.layers.41.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="7050,7051,7052"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9771" name="__module.model.layers.41.self_attn/aten::size/ShapeOf_6" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9772" name="Constant_302569" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="938477672" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9773" name="Constant_302570" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="9774" name="Gather_302571" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9775" name="Constant_269310" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9776" name="Constant_277626" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9777" name="Constant_277627" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="9778" name="Gather_277628" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9779" name="__module.model.layers.41.self_attn/prim::ListConstruct/Concat_2" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="3" precision="I64" names="7053"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="9780" name="__module.model.layers.41.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7054,hidden_states.1241"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9781" name="Constant_301945" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9782" name="__module.model.layers.41.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7058,key_states.171"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9783" name="Constant_341854" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="9784" name="Constant_341847" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9785" name="Constant_341849" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9786" name="Constant_341851" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9787" name="Concat_341852" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9788" name="Broadcast_341855" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9789" name="ReadValue_333222" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.41.valuepresent.41.value" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.41.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9790" name="Constant_325558" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="9791" name="Gather_325559" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9792" name="self.model.layers.41.self_attn.v_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="6660753528" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9793" name="Convert_387817" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9794" name="self.model.layers.41.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="6663374968" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9795" name="Convert_387819" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9796" name="self.model.layers.41.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9797" name="self.model.layers.41.self_attn.v_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="6663395448" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9798" name="self.model.layers.41.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9799" name="Constant_387824" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9800" name="Reshape_387825" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9801" name="__module.model.layers.41.self_attn.v_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9802" name="__module.model.layers.41.self_attn.v_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="9803" name="self.model.layers.41.self_attn.v_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="6663477368" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.41.self_attn.v_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="9804" name="__module.model.layers.41.self_attn.v_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="9805" name="__module.model.layers.41.self_attn.v_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="6995,value_states.83"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="9806" name="Constant_301946" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9807" name="__module.model.layers.41.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7003"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9808" name="__module.model.layers.41.self_attn/aten::transpose/ScatterElementsUpdate_2" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9809" name="__module.model.layers.41.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7004"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9810" name="__module.model.layers.41.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.41.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9811" name="__module.model.layers.41.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="7066,7067,7068"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9812" name="__module.model.layers.41.self_attn/aten::size/ShapeOf_10" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9813" name="Constant_302331" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9814" name="__module.model.layers.41.self_attn/aten::size/Constant_11" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="9815" name="__module.model.layers.41.self_attn/aten::size/Gather_11" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="7060"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9816" name="Constant_269328" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9817" name="Constant_277636" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9818" name="Constant_277637" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="9819" name="Gather_277638" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9820" name="__module.model.layers.41.self_attn/prim::ListConstruct/Concat_5" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="7069"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="9821" name="__module.model.layers.41.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7070,hidden_states.1245"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9822" name="Constant_301947" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9823" name="__module.model.layers.41.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7074"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9824" name="__module.model.layers.41.self_attn/aten::slice/Reshape_60" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9825" name="ShapeOf_301106" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9826" name="Constant_301107" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9827" name="Constant_301108" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="9828" name="Gather_301109" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9829" name="ShapeOf_301110" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9830" name="Constant_301111" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9831" name="Constant_301112" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="9832" name="Gather_301113" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9833" name="Add_301114" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="7075"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9834" name="__module.model.layers.41.self_attn/aten::slice/Reshape_62" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9835" name="__module.model.layers.41.self_attn/aten::slice/Reshape_63" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9836" name="__module.model.layers.41.self_attn/aten::slice/Slice_15" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="7079"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="9837" name="__module.model.layers.41.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="7080,attn_output.165"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9838" name="__module.model.layers.41.self_attn/aten::transpose/ScatterElementsUpdate_3" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9839" name="__module.model.layers.41.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7081"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9840" name="Constant_301948" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="798146608" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="9841" name="__module.model.layers.41.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7084"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9842" name="self.model.layers.41.self_attn.o_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="6663479416" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9843" name="Convert_386857" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9844" name="self.model.layers.41.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="6676586616" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9845" name="Convert_386859" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9846" name="self.model.layers.41.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9847" name="self.model.layers.41.self_attn.o_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="6676689016" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9848" name="self.model.layers.41.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9849" name="Constant_386864" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9850" name="Reshape_386865" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9851" name="__module.model.layers.41.self_attn.o_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9852" name="__module.model.layers.41.self_attn.o_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7086,7088,hidden_states.1247"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9853" name="__module.model.layers.41/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7091,7093,7104,hidden_states.1249,hidden_states.1251"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9854" name="Constant_290467" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="6677098616" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9855" name="Constant_290466" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9856" name="Constant_290464" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9857" name="__module.model.layers.41.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7094"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9858" name="Constant_28676" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="7095"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9859" name="__module.model.layers.41.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7096,variance.167"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9860" name="Constant_290465" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9861" name="__module.model.layers.41.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7097"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9862" name="__module.model.layers.41.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9863" name="__module.model.layers.41.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7098"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9864" name="__module.model.layers.41.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7099,7100,hidden_states.1253,hidden_states.1255"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9865" name="__module.model.layers.41.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7101,7103"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9866" name="self.model.layers.41.mlp.gate_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="6677119096" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9867" name="Convert_385827" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9868" name="self.model.layers.41.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="6712508536" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9869" name="Convert_385829" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9870" name="self.model.layers.41.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9871" name="self.model.layers.41.mlp.gate_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="6712785016" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9872" name="self.model.layers.41.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9873" name="Constant_385834" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9874" name="Reshape_385835" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9875" name="__module.model.layers.41.mlp.gate_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9876" name="__module.model.layers.41.mlp.gate_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7109,input.83"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="9877" name="__module.model.layers.41.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="7110"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="9878" name="self.model.layers.41.mlp.up_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="6713890936" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9879" name="Convert_385817" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9880" name="self.model.layers.41.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="6749280376" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9881" name="Convert_385819" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9882" name="self.model.layers.41.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9883" name="self.model.layers.41.mlp.up_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="6749556856" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9884" name="self.model.layers.41.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9885" name="Constant_385824" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9886" name="Reshape_385825" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9887" name="__module.model.layers.41.mlp.up_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9888" name="__module.model.layers.41.mlp.up_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7112"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="9889" name="__module.model.layers.41.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7113"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="9890" name="self.model.layers.41.mlp.down_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 128" offset="6750662776" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9891" name="Convert_385837" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9892" name="self.model.layers.41.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 1" offset="6786052216" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9893" name="Convert_385839" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9894" name="self.model.layers.41.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9895" name="self.model.layers.41.mlp.down_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 108, 1" offset="6786328696" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9896" name="self.model.layers.41.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9897" name="Constant_385844" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="922101848" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9898" name="Reshape_385845" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="9899" name="__module.model.layers.41.mlp.down_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="9900" name="__module.model.layers.41.mlp.down_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7115,hidden_states.1257"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9901" name="__module.model.layers.41/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7116,7118,7126,7137,hidden_states.1259,hidden_states.1261"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9902" name="Constant_290471" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="6787434616" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9903" name="Constant_290470" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9904" name="Constant_290468" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9905" name="__module.model.layers.42.input_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7127"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9906" name="Constant_28750" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="7128"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9907" name="__module.model.layers.42.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7129,variance.169"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9908" name="Constant_290469" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9909" name="__module.model.layers.42.input_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7130"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9910" name="__module.model.layers.42.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9911" name="__module.model.layers.42.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7131"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9912" name="__module.model.layers.42.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7132,7133,hidden_states.1263,hidden_states.1265"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9913" name="__module.model.layers.42.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7134,7136,hidden_states.1267"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9914" name="self.model.layers.42.self_attn.q_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="6787455096" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9915" name="Convert_386867" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9916" name="self.model.layers.42.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="6800562296" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9917" name="Convert_386869" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9918" name="self.model.layers.42.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9919" name="self.model.layers.42.self_attn.q_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="6800664696" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9920" name="self.model.layers.42.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9921" name="Constant_386874" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9922" name="Reshape_386875" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9923" name="__module.model.layers.42.self_attn.q_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9924" name="__module.model.layers.42.self_attn.q_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9925" name="self.model.layers.42.self_attn.q_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="5120" offset="6801074296" size="10240" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.42.self_attn.q_proj.bias"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9926" name="__module.model.layers.42.self_attn.q_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9927" name="__module.model.layers.42.self_attn.q_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7146,query_states.85"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9928" name="Constant_301949" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="792694336" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9929" name="__module.model.layers.42.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7154"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9930" name="__module.model.layers.42.self_attn/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9931" name="__module.model.layers.42.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7155,q.85"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9932" name="__module.model.layers.42.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7164"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9933" name="__module.model.layers.42.self_attn/aten::size/ShapeOf_3" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9934" name="__module.model.layers.42.self_attn/aten::size/Constant_3" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="9935" name="__module.model.layers.42.self_attn/aten::size/Gather_3" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="7165,7170" /> + </output> + </layer> + <layer id="9936" name="__module.model.layers.42.self_attn/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="9937" name="__module.model.layers.42.self_attn/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="7167,7168,7172,7173" /> + </output> + </layer> + <layer id="9938" name="Constant_221175" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9939" name="__module.model.layers.42.self_attn/aten::slice/Reshape_5" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9940" name="__module.model.layers.42.self_attn/aten::slice/Reshape_1" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9941" name="__module.model.layers.42.self_attn/aten::slice/Reshape_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9942" name="__module.model.layers.42.self_attn/aten::slice/Reshape_3" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9943" name="__module.model.layers.42.self_attn/aten::slice/Slice" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="7174,x2.169"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="9944" name="Constant_290472" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9945" name="__module.model.layers.42.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7175"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="9946" name="__module.model.layers.42.self_attn/aten::slice/Reshape_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9947" name="__module.model.layers.42.self_attn/aten::slice/Reshape_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9948" name="__module.model.layers.42.self_attn/aten::slice/Reshape_7" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9949" name="__module.model.layers.42.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="7169"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="9950" name="__module.model.layers.42.self_attn/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7177"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9951" name="__module.model.layers.42.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7178"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9952" name="__module.model.layers.42.self_attn/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7179"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9953" name="Constant_341867" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="9954" name="Constant_341860" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9955" name="Constant_341862" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9956" name="Constant_341864" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9957" name="Concat_341865" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9958" name="Broadcast_341868" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9959" name="ReadValue_333224" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.42.keypresent.42.key" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.42.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9960" name="Constant_325561" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="9961" name="Gather_325562" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9962" name="self.model.layers.42.self_attn.k_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="6801084536" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9963" name="Convert_387827" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9964" name="self.model.layers.42.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="6803705976" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9965" name="Convert_387829" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9966" name="self.model.layers.42.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9967" name="self.model.layers.42.self_attn.k_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="6803726456" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9968" name="self.model.layers.42.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9969" name="Constant_387834" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="9970" name="Reshape_387835" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9971" name="__module.model.layers.42.self_attn.k_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="9972" name="__module.model.layers.42.self_attn.k_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="9973" name="self.model.layers.42.self_attn.k_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="6803808376" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.42.self_attn.k_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="9974" name="__module.model.layers.42.self_attn.k_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="9975" name="__module.model.layers.42.self_attn.k_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7149,key_states.173"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="9976" name="Constant_301950" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9977" name="__module.model.layers.42.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7157"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9978" name="__module.model.layers.42.self_attn/aten::transpose/ScatterElementsUpdate_1" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9979" name="__module.model.layers.42.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7158,k.85"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9980" name="__module.model.layers.42.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7180"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9981" name="__module.model.layers.42.self_attn/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="9982" name="__module.model.layers.42.self_attn/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="9983" name="__module.model.layers.42.self_attn/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="7181,7186" /> + </output> + </layer> + <layer id="9984" name="__module.model.layers.42.self_attn/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="9985" name="__module.model.layers.42.self_attn/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="7183,7184,7188,7189" /> + </output> + </layer> + <layer id="9986" name="Constant_221176" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9987" name="__module.model.layers.42.self_attn/aten::slice/Reshape_13" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9988" name="__module.model.layers.42.self_attn/aten::slice/Reshape_9" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9989" name="__module.model.layers.42.self_attn/aten::slice/Reshape_10" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9990" name="__module.model.layers.42.self_attn/aten::slice/Reshape_11" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9991" name="__module.model.layers.42.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="7190,x2.171"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="9992" name="Constant_290473" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9993" name="__module.model.layers.42.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7191"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="9994" name="__module.model.layers.42.self_attn/aten::slice/Reshape_12" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9995" name="__module.model.layers.42.self_attn/aten::slice/Reshape_14" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9996" name="__module.model.layers.42.self_attn/aten::slice/Reshape_15" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="9997" name="__module.model.layers.42.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="7185"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="9998" name="__module.model.layers.42.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7193"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="9999" name="__module.model.layers.42.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7194"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10000" name="__module.model.layers.42.self_attn/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7195"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10001" name="__module.model.layers.42.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.42.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10002" name="__module.model.layers.42.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="7207,7208,7209"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10003" name="__module.model.layers.42.self_attn/aten::size/ShapeOf_6" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10004" name="Constant_302574" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="938477672" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10005" name="Constant_302575" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="10006" name="Gather_302576" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10007" name="Constant_269346" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10008" name="Constant_277661" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10009" name="Constant_277662" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="10010" name="Gather_277663" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10011" name="__module.model.layers.42.self_attn/prim::ListConstruct/Concat_2" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="3" precision="I64" names="7210"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="10012" name="__module.model.layers.42.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7211,hidden_states.1271"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10013" name="Constant_301951" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10014" name="__module.model.layers.42.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7215,key_states.175"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10015" name="Constant_341880" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="10016" name="Constant_341873" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10017" name="Constant_341875" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10018" name="Constant_341877" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10019" name="Concat_341878" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10020" name="Broadcast_341881" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10021" name="ReadValue_333226" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.42.valuepresent.42.value" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.42.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10022" name="Constant_325564" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="10023" name="Gather_325565" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10024" name="self.model.layers.42.self_attn.v_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="6803810424" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10025" name="Convert_387837" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10026" name="self.model.layers.42.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="6806431864" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10027" name="Convert_387839" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10028" name="self.model.layers.42.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10029" name="self.model.layers.42.self_attn.v_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="6806452344" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10030" name="self.model.layers.42.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10031" name="Constant_387844" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10032" name="Reshape_387845" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10033" name="__module.model.layers.42.self_attn.v_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10034" name="__module.model.layers.42.self_attn.v_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="10035" name="self.model.layers.42.self_attn.v_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="6806534264" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.42.self_attn.v_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="10036" name="__module.model.layers.42.self_attn.v_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="10037" name="__module.model.layers.42.self_attn.v_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7152,value_states.85"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="10038" name="Constant_301952" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10039" name="__module.model.layers.42.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7160"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10040" name="__module.model.layers.42.self_attn/aten::transpose/ScatterElementsUpdate_2" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10041" name="__module.model.layers.42.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7161"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10042" name="__module.model.layers.42.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.42.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10043" name="__module.model.layers.42.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="7223,7224,7225"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10044" name="__module.model.layers.42.self_attn/aten::size/ShapeOf_10" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10045" name="Constant_302337" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10046" name="__module.model.layers.42.self_attn/aten::size/Constant_11" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="10047" name="__module.model.layers.42.self_attn/aten::size/Gather_11" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="7217"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10048" name="Constant_269364" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10049" name="Constant_277671" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10050" name="Constant_277672" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="10051" name="Gather_277673" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10052" name="__module.model.layers.42.self_attn/prim::ListConstruct/Concat_5" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="7226"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="10053" name="__module.model.layers.42.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7227,hidden_states.1275"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10054" name="Constant_301953" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10055" name="__module.model.layers.42.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7231"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10056" name="__module.model.layers.42.self_attn/aten::slice/Reshape_60" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10057" name="ShapeOf_301192" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10058" name="Constant_301193" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10059" name="Constant_301194" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="10060" name="Gather_301195" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10061" name="ShapeOf_301196" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10062" name="Constant_301197" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10063" name="Constant_301198" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="10064" name="Gather_301199" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10065" name="Add_301200" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="7232"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10066" name="__module.model.layers.42.self_attn/aten::slice/Reshape_62" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10067" name="__module.model.layers.42.self_attn/aten::slice/Reshape_63" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10068" name="__module.model.layers.42.self_attn/aten::slice/Slice_15" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="7236"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="10069" name="__module.model.layers.42.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="7237,attn_output.169"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10070" name="__module.model.layers.42.self_attn/aten::transpose/ScatterElementsUpdate_3" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10071" name="__module.model.layers.42.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7238"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10072" name="Constant_301954" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="798146608" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="10073" name="__module.model.layers.42.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7241"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10074" name="self.model.layers.42.self_attn.o_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="6806536312" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10075" name="Convert_386877" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10076" name="self.model.layers.42.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="6819643512" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10077" name="Convert_386879" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10078" name="self.model.layers.42.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10079" name="self.model.layers.42.self_attn.o_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="6819745912" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10080" name="self.model.layers.42.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10081" name="Constant_386884" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10082" name="Reshape_386885" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10083" name="__module.model.layers.42.self_attn.o_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10084" name="__module.model.layers.42.self_attn.o_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7243,7245,hidden_states.1277"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10085" name="__module.model.layers.42/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7248,7250,7261,hidden_states.1279,hidden_states.1281"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10086" name="Constant_290477" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="6820155512" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10087" name="Constant_290476" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10088" name="Constant_290474" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10089" name="__module.model.layers.42.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7251"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10090" name="Constant_29348" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="7252"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10091" name="__module.model.layers.42.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7253,variance.171"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10092" name="Constant_290475" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10093" name="__module.model.layers.42.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7254"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10094" name="__module.model.layers.42.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10095" name="__module.model.layers.42.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7255"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10096" name="__module.model.layers.42.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7256,7257,hidden_states.1283,hidden_states.1285"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10097" name="__module.model.layers.42.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7258,7260"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10098" name="self.model.layers.42.mlp.gate_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="6820175992" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10099" name="Convert_385857" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10100" name="self.model.layers.42.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="6855565432" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10101" name="Convert_385859" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10102" name="self.model.layers.42.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10103" name="self.model.layers.42.mlp.gate_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="6855841912" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10104" name="self.model.layers.42.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10105" name="Constant_385864" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10106" name="Reshape_385865" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10107" name="__module.model.layers.42.mlp.gate_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10108" name="__module.model.layers.42.mlp.gate_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7266,input.85"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="10109" name="__module.model.layers.42.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="7267"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="10110" name="self.model.layers.42.mlp.up_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="6856947832" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10111" name="Convert_385847" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10112" name="self.model.layers.42.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="6892337272" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10113" name="Convert_385849" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10114" name="self.model.layers.42.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10115" name="self.model.layers.42.mlp.up_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="6892613752" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10116" name="self.model.layers.42.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10117" name="Constant_385854" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10118" name="Reshape_385855" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10119" name="__module.model.layers.42.mlp.up_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10120" name="__module.model.layers.42.mlp.up_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7269"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="10121" name="__module.model.layers.42.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7270"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="10122" name="self.model.layers.42.mlp.down_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 128" offset="6893719672" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10123" name="Convert_385867" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10124" name="self.model.layers.42.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 1" offset="6929109112" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10125" name="Convert_385869" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10126" name="self.model.layers.42.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10127" name="self.model.layers.42.mlp.down_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 108, 1" offset="6929385592" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10128" name="self.model.layers.42.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10129" name="Constant_385874" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="922101848" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10130" name="Reshape_385875" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="10131" name="__module.model.layers.42.mlp.down_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="10132" name="__module.model.layers.42.mlp.down_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7272,hidden_states.1287"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10133" name="__module.model.layers.42/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7273,7275,7283,7294,hidden_states.1289,hidden_states.1291"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10134" name="Constant_290481" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="6930491512" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10135" name="Constant_290480" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10136" name="Constant_290478" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10137" name="__module.model.layers.43.input_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7284"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10138" name="Constant_29422" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="7285"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10139" name="__module.model.layers.43.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7286,variance.173"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10140" name="Constant_290479" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10141" name="__module.model.layers.43.input_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7287"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10142" name="__module.model.layers.43.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10143" name="__module.model.layers.43.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7288"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10144" name="__module.model.layers.43.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7289,7290,hidden_states.1293,hidden_states.1295"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10145" name="__module.model.layers.43.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7291,7293,hidden_states.1297"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10146" name="self.model.layers.43.self_attn.q_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="6930511992" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10147" name="Convert_386887" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10148" name="self.model.layers.43.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="6943619192" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10149" name="Convert_386889" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10150" name="self.model.layers.43.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10151" name="self.model.layers.43.self_attn.q_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="6943721592" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10152" name="self.model.layers.43.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10153" name="Constant_386894" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10154" name="Reshape_386895" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10155" name="__module.model.layers.43.self_attn.q_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10156" name="__module.model.layers.43.self_attn.q_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10157" name="self.model.layers.43.self_attn.q_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="5120" offset="6944131192" size="10240" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.43.self_attn.q_proj.bias"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10158" name="__module.model.layers.43.self_attn.q_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10159" name="__module.model.layers.43.self_attn.q_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7303,query_states.87"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10160" name="Constant_301955" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="792694336" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10161" name="__module.model.layers.43.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7311"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10162" name="__module.model.layers.43.self_attn/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10163" name="__module.model.layers.43.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7312,q.87"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10164" name="__module.model.layers.43.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7321"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10165" name="__module.model.layers.43.self_attn/aten::size/ShapeOf_3" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10166" name="__module.model.layers.43.self_attn/aten::size/Constant_3" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="10167" name="__module.model.layers.43.self_attn/aten::size/Gather_3" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="7322,7327" /> + </output> + </layer> + <layer id="10168" name="__module.model.layers.43.self_attn/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="10169" name="__module.model.layers.43.self_attn/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="7324,7325,7329,7330" /> + </output> + </layer> + <layer id="10170" name="Constant_221190" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10171" name="__module.model.layers.43.self_attn/aten::slice/Reshape_5" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10172" name="__module.model.layers.43.self_attn/aten::slice/Reshape_1" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10173" name="__module.model.layers.43.self_attn/aten::slice/Reshape_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10174" name="__module.model.layers.43.self_attn/aten::slice/Reshape_3" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10175" name="__module.model.layers.43.self_attn/aten::slice/Slice" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="7331,x2.173"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="10176" name="Constant_290482" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10177" name="__module.model.layers.43.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7332"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="10178" name="__module.model.layers.43.self_attn/aten::slice/Reshape_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10179" name="__module.model.layers.43.self_attn/aten::slice/Reshape_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10180" name="__module.model.layers.43.self_attn/aten::slice/Reshape_7" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10181" name="__module.model.layers.43.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="7326"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="10182" name="__module.model.layers.43.self_attn/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7334"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10183" name="__module.model.layers.43.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7335"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10184" name="__module.model.layers.43.self_attn/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7336"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10185" name="Constant_341893" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="10186" name="Constant_341886" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10187" name="Constant_341888" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10188" name="Constant_341890" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10189" name="Concat_341891" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10190" name="Broadcast_341894" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10191" name="ReadValue_333228" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.43.keypresent.43.key" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.43.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10192" name="Constant_325567" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="10193" name="Gather_325568" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10194" name="self.model.layers.43.self_attn.k_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="6944141432" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10195" name="Convert_387847" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10196" name="self.model.layers.43.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="6946762872" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10197" name="Convert_387849" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10198" name="self.model.layers.43.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10199" name="self.model.layers.43.self_attn.k_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="6946783352" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10200" name="self.model.layers.43.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10201" name="Constant_387854" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10202" name="Reshape_387855" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10203" name="__module.model.layers.43.self_attn.k_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10204" name="__module.model.layers.43.self_attn.k_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="10205" name="self.model.layers.43.self_attn.k_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="6946865272" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.43.self_attn.k_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="10206" name="__module.model.layers.43.self_attn.k_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="10207" name="__module.model.layers.43.self_attn.k_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7306,key_states.177"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="10208" name="Constant_301956" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10209" name="__module.model.layers.43.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7314"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10210" name="__module.model.layers.43.self_attn/aten::transpose/ScatterElementsUpdate_1" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10211" name="__module.model.layers.43.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7315,k.87"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10212" name="__module.model.layers.43.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7337"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10213" name="__module.model.layers.43.self_attn/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10214" name="__module.model.layers.43.self_attn/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="10215" name="__module.model.layers.43.self_attn/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="7338,7343" /> + </output> + </layer> + <layer id="10216" name="__module.model.layers.43.self_attn/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="10217" name="__module.model.layers.43.self_attn/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="7340,7341,7345,7346" /> + </output> + </layer> + <layer id="10218" name="Constant_221191" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10219" name="__module.model.layers.43.self_attn/aten::slice/Reshape_13" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10220" name="__module.model.layers.43.self_attn/aten::slice/Reshape_9" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10221" name="__module.model.layers.43.self_attn/aten::slice/Reshape_10" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10222" name="__module.model.layers.43.self_attn/aten::slice/Reshape_11" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10223" name="__module.model.layers.43.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="7347,x2.175"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="10224" name="Constant_290483" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10225" name="__module.model.layers.43.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7348"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="10226" name="__module.model.layers.43.self_attn/aten::slice/Reshape_12" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10227" name="__module.model.layers.43.self_attn/aten::slice/Reshape_14" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10228" name="__module.model.layers.43.self_attn/aten::slice/Reshape_15" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10229" name="__module.model.layers.43.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="7342"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="10230" name="__module.model.layers.43.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7350"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10231" name="__module.model.layers.43.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7351"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10232" name="__module.model.layers.43.self_attn/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7352"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10233" name="__module.model.layers.43.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.43.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10234" name="__module.model.layers.43.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="7364,7365,7366"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10235" name="__module.model.layers.43.self_attn/aten::size/ShapeOf_6" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10236" name="Constant_302579" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="938477672" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10237" name="Constant_302580" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="10238" name="Gather_302581" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10239" name="Constant_269382" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10240" name="Constant_277696" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10241" name="Constant_277697" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="10242" name="Gather_277698" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10243" name="__module.model.layers.43.self_attn/prim::ListConstruct/Concat_2" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="3" precision="I64" names="7367"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="10244" name="__module.model.layers.43.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7368,hidden_states.1301"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10245" name="Constant_301957" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10246" name="__module.model.layers.43.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7372,key_states.179"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10247" name="Constant_341906" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="10248" name="Constant_341899" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10249" name="Constant_341901" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10250" name="Constant_341903" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10251" name="Concat_341904" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10252" name="Broadcast_341907" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10253" name="ReadValue_333230" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.43.valuepresent.43.value" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.43.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10254" name="Constant_325570" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="10255" name="Gather_325571" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10256" name="self.model.layers.43.self_attn.v_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="6946867320" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10257" name="Convert_387857" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10258" name="self.model.layers.43.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="6949488760" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10259" name="Convert_387859" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10260" name="self.model.layers.43.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10261" name="self.model.layers.43.self_attn.v_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="6949509240" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10262" name="self.model.layers.43.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10263" name="Constant_387864" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10264" name="Reshape_387865" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10265" name="__module.model.layers.43.self_attn.v_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10266" name="__module.model.layers.43.self_attn.v_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="10267" name="self.model.layers.43.self_attn.v_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="6949591160" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.43.self_attn.v_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="10268" name="__module.model.layers.43.self_attn.v_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="10269" name="__module.model.layers.43.self_attn.v_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7309,value_states.87"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="10270" name="Constant_301958" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10271" name="__module.model.layers.43.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7317"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10272" name="__module.model.layers.43.self_attn/aten::transpose/ScatterElementsUpdate_2" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10273" name="__module.model.layers.43.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7318"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10274" name="__module.model.layers.43.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.43.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10275" name="__module.model.layers.43.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="7380,7381,7382"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10276" name="__module.model.layers.43.self_attn/aten::size/ShapeOf_10" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10277" name="Constant_302343" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10278" name="__module.model.layers.43.self_attn/aten::size/Constant_11" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="10279" name="__module.model.layers.43.self_attn/aten::size/Gather_11" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="7374"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10280" name="Constant_269400" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10281" name="Constant_277706" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10282" name="Constant_277707" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="10283" name="Gather_277708" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10284" name="__module.model.layers.43.self_attn/prim::ListConstruct/Concat_5" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="7383"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="10285" name="__module.model.layers.43.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7384,hidden_states.1305"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10286" name="Constant_301959" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10287" name="__module.model.layers.43.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7388"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10288" name="__module.model.layers.43.self_attn/aten::slice/Reshape_60" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10289" name="ShapeOf_301278" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10290" name="Constant_301279" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10291" name="Constant_301280" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="10292" name="Gather_301281" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10293" name="ShapeOf_301282" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10294" name="Constant_301283" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10295" name="Constant_301284" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="10296" name="Gather_301285" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10297" name="Add_301286" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="7389"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10298" name="__module.model.layers.43.self_attn/aten::slice/Reshape_62" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10299" name="__module.model.layers.43.self_attn/aten::slice/Reshape_63" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10300" name="__module.model.layers.43.self_attn/aten::slice/Slice_15" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="7393"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="10301" name="__module.model.layers.43.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="7394,attn_output.173"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10302" name="__module.model.layers.43.self_attn/aten::transpose/ScatterElementsUpdate_3" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10303" name="__module.model.layers.43.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7395"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10304" name="Constant_301960" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="798146608" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="10305" name="__module.model.layers.43.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7398"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10306" name="self.model.layers.43.self_attn.o_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="6949593208" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10307" name="Convert_386897" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10308" name="self.model.layers.43.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="6962700408" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10309" name="Convert_386899" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10310" name="self.model.layers.43.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10311" name="self.model.layers.43.self_attn.o_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="6962802808" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10312" name="self.model.layers.43.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10313" name="Constant_386904" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10314" name="Reshape_386905" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10315" name="__module.model.layers.43.self_attn.o_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10316" name="__module.model.layers.43.self_attn.o_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7400,7402,hidden_states.1307"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10317" name="__module.model.layers.43/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7405,7407,7418,hidden_states.1309,hidden_states.1311"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10318" name="Constant_290487" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="6963212408" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10319" name="Constant_290486" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10320" name="Constant_290484" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10321" name="__module.model.layers.43.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7408"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10322" name="Constant_30020" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="7409"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10323" name="__module.model.layers.43.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7410,variance.175"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10324" name="Constant_290485" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10325" name="__module.model.layers.43.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7411"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10326" name="__module.model.layers.43.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10327" name="__module.model.layers.43.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7412"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10328" name="__module.model.layers.43.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7413,7414,hidden_states.1313,hidden_states.1315"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10329" name="__module.model.layers.43.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7415,7417"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10330" name="self.model.layers.43.mlp.gate_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="6963232888" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10331" name="Convert_385887" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10332" name="self.model.layers.43.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="6998622328" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10333" name="Convert_385889" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10334" name="self.model.layers.43.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10335" name="self.model.layers.43.mlp.gate_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="6998898808" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10336" name="self.model.layers.43.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10337" name="Constant_385894" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10338" name="Reshape_385895" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10339" name="__module.model.layers.43.mlp.gate_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10340" name="__module.model.layers.43.mlp.gate_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7423,input.87"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="10341" name="__module.model.layers.43.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="7424"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="10342" name="self.model.layers.43.mlp.up_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="7000004728" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10343" name="Convert_385877" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10344" name="self.model.layers.43.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="7035394168" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10345" name="Convert_385879" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10346" name="self.model.layers.43.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10347" name="self.model.layers.43.mlp.up_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="7035670648" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10348" name="self.model.layers.43.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10349" name="Constant_385884" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10350" name="Reshape_385885" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10351" name="__module.model.layers.43.mlp.up_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10352" name="__module.model.layers.43.mlp.up_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7426"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="10353" name="__module.model.layers.43.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7427"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="10354" name="self.model.layers.43.mlp.down_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 128" offset="7036776568" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10355" name="Convert_385897" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10356" name="self.model.layers.43.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 1" offset="7072166008" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10357" name="Convert_385899" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10358" name="self.model.layers.43.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10359" name="self.model.layers.43.mlp.down_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 108, 1" offset="7072442488" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10360" name="self.model.layers.43.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10361" name="Constant_385904" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="922101848" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10362" name="Reshape_385905" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="10363" name="__module.model.layers.43.mlp.down_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="10364" name="__module.model.layers.43.mlp.down_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7429,hidden_states.1317"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10365" name="__module.model.layers.43/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7430,7432,7440,7451,hidden_states.1319,hidden_states.1321"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10366" name="Constant_290491" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="7073548408" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10367" name="Constant_290490" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10368" name="Constant_290488" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10369" name="__module.model.layers.44.input_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7441"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10370" name="Constant_30094" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="7442"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10371" name="__module.model.layers.44.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7443,variance.177"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10372" name="Constant_290489" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10373" name="__module.model.layers.44.input_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7444"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10374" name="__module.model.layers.44.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10375" name="__module.model.layers.44.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7445"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10376" name="__module.model.layers.44.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7446,7447,hidden_states.1323,hidden_states.1325"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10377" name="__module.model.layers.44.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7448,7450,hidden_states.1327"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10378" name="self.model.layers.44.self_attn.q_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="7073568888" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10379" name="Convert_386907" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10380" name="self.model.layers.44.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="7086676088" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10381" name="Convert_386909" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10382" name="self.model.layers.44.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10383" name="self.model.layers.44.self_attn.q_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="7086778488" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10384" name="self.model.layers.44.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10385" name="Constant_386914" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10386" name="Reshape_386915" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10387" name="__module.model.layers.44.self_attn.q_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10388" name="__module.model.layers.44.self_attn.q_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10389" name="self.model.layers.44.self_attn.q_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="5120" offset="7087188088" size="10240" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.44.self_attn.q_proj.bias"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10390" name="__module.model.layers.44.self_attn.q_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10391" name="__module.model.layers.44.self_attn.q_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7460,query_states.89"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10392" name="Constant_301961" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="792694336" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10393" name="__module.model.layers.44.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7468"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10394" name="__module.model.layers.44.self_attn/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10395" name="__module.model.layers.44.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7469,q.89"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10396" name="__module.model.layers.44.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7478"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10397" name="__module.model.layers.44.self_attn/aten::size/ShapeOf_3" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10398" name="__module.model.layers.44.self_attn/aten::size/Constant_3" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="10399" name="__module.model.layers.44.self_attn/aten::size/Gather_3" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="7479,7484" /> + </output> + </layer> + <layer id="10400" name="__module.model.layers.44.self_attn/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="10401" name="__module.model.layers.44.self_attn/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="7481,7482,7486,7487" /> + </output> + </layer> + <layer id="10402" name="Constant_221205" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10403" name="__module.model.layers.44.self_attn/aten::slice/Reshape_5" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10404" name="__module.model.layers.44.self_attn/aten::slice/Reshape_1" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10405" name="__module.model.layers.44.self_attn/aten::slice/Reshape_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10406" name="__module.model.layers.44.self_attn/aten::slice/Reshape_3" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10407" name="__module.model.layers.44.self_attn/aten::slice/Slice" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="7488,x2.177"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="10408" name="Constant_290492" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10409" name="__module.model.layers.44.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7489"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="10410" name="__module.model.layers.44.self_attn/aten::slice/Reshape_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10411" name="__module.model.layers.44.self_attn/aten::slice/Reshape_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10412" name="__module.model.layers.44.self_attn/aten::slice/Reshape_7" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10413" name="__module.model.layers.44.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="7483"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="10414" name="__module.model.layers.44.self_attn/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7491"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10415" name="__module.model.layers.44.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7492"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10416" name="__module.model.layers.44.self_attn/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7493"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10417" name="Constant_341919" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="10418" name="Constant_341912" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10419" name="Constant_341914" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10420" name="Constant_341916" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10421" name="Concat_341917" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10422" name="Broadcast_341920" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10423" name="ReadValue_333232" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.44.keypresent.44.key" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.44.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10424" name="Constant_325573" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="10425" name="Gather_325574" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10426" name="self.model.layers.44.self_attn.k_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="7087198328" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10427" name="Convert_387867" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10428" name="self.model.layers.44.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="7089819768" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10429" name="Convert_387869" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10430" name="self.model.layers.44.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10431" name="self.model.layers.44.self_attn.k_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="7089840248" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10432" name="self.model.layers.44.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10433" name="Constant_387874" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10434" name="Reshape_387875" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10435" name="__module.model.layers.44.self_attn.k_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10436" name="__module.model.layers.44.self_attn.k_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="10437" name="self.model.layers.44.self_attn.k_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="7089922168" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.44.self_attn.k_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="10438" name="__module.model.layers.44.self_attn.k_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="10439" name="__module.model.layers.44.self_attn.k_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7463,key_states.181"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="10440" name="Constant_301962" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10441" name="__module.model.layers.44.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7471"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10442" name="__module.model.layers.44.self_attn/aten::transpose/ScatterElementsUpdate_1" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10443" name="__module.model.layers.44.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7472,k.89"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10444" name="__module.model.layers.44.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7494"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10445" name="__module.model.layers.44.self_attn/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10446" name="__module.model.layers.44.self_attn/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="10447" name="__module.model.layers.44.self_attn/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="7495,7500" /> + </output> + </layer> + <layer id="10448" name="__module.model.layers.44.self_attn/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="10449" name="__module.model.layers.44.self_attn/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="7497,7498,7502,7503" /> + </output> + </layer> + <layer id="10450" name="Constant_221206" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10451" name="__module.model.layers.44.self_attn/aten::slice/Reshape_13" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10452" name="__module.model.layers.44.self_attn/aten::slice/Reshape_9" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10453" name="__module.model.layers.44.self_attn/aten::slice/Reshape_10" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10454" name="__module.model.layers.44.self_attn/aten::slice/Reshape_11" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10455" name="__module.model.layers.44.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="7504,x2.179"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="10456" name="Constant_290493" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10457" name="__module.model.layers.44.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7505"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="10458" name="__module.model.layers.44.self_attn/aten::slice/Reshape_12" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10459" name="__module.model.layers.44.self_attn/aten::slice/Reshape_14" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10460" name="__module.model.layers.44.self_attn/aten::slice/Reshape_15" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10461" name="__module.model.layers.44.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="7499"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="10462" name="__module.model.layers.44.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7507"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10463" name="__module.model.layers.44.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7508"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10464" name="__module.model.layers.44.self_attn/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7509"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10465" name="__module.model.layers.44.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.44.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10466" name="__module.model.layers.44.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="7521,7522,7523"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10467" name="__module.model.layers.44.self_attn/aten::size/ShapeOf_6" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10468" name="Constant_302584" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="938477672" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10469" name="Constant_302585" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="10470" name="Gather_302586" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10471" name="Constant_269418" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10472" name="Constant_277731" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10473" name="Constant_277732" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="10474" name="Gather_277733" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10475" name="__module.model.layers.44.self_attn/prim::ListConstruct/Concat_2" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="3" precision="I64" names="7524"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="10476" name="__module.model.layers.44.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7525,hidden_states.1331"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10477" name="Constant_301963" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10478" name="__module.model.layers.44.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7529,key_states.183"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10479" name="Constant_341932" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="10480" name="Constant_341925" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10481" name="Constant_341927" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10482" name="Constant_341929" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10483" name="Concat_341930" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10484" name="Broadcast_341933" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10485" name="ReadValue_333234" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.44.valuepresent.44.value" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.44.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10486" name="Constant_325576" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="10487" name="Gather_325577" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10488" name="self.model.layers.44.self_attn.v_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="7089924216" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10489" name="Convert_387877" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10490" name="self.model.layers.44.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="7092545656" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10491" name="Convert_387879" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10492" name="self.model.layers.44.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10493" name="self.model.layers.44.self_attn.v_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="7092566136" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10494" name="self.model.layers.44.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10495" name="Constant_387884" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10496" name="Reshape_387885" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10497" name="__module.model.layers.44.self_attn.v_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10498" name="__module.model.layers.44.self_attn.v_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="10499" name="self.model.layers.44.self_attn.v_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="7092648056" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.44.self_attn.v_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="10500" name="__module.model.layers.44.self_attn.v_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="10501" name="__module.model.layers.44.self_attn.v_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7466,value_states.89"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="10502" name="Constant_301964" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10503" name="__module.model.layers.44.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7474"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10504" name="__module.model.layers.44.self_attn/aten::transpose/ScatterElementsUpdate_2" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10505" name="__module.model.layers.44.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7475"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10506" name="__module.model.layers.44.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.44.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10507" name="__module.model.layers.44.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="7537,7538,7539"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10508" name="__module.model.layers.44.self_attn/aten::size/ShapeOf_10" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10509" name="Constant_302349" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10510" name="__module.model.layers.44.self_attn/aten::size/Constant_11" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="10511" name="__module.model.layers.44.self_attn/aten::size/Gather_11" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="7531"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10512" name="Constant_269436" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10513" name="Constant_277741" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10514" name="Constant_277742" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="10515" name="Gather_277743" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10516" name="__module.model.layers.44.self_attn/prim::ListConstruct/Concat_5" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="7540"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="10517" name="__module.model.layers.44.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7541,hidden_states.1335"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10518" name="Constant_301965" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10519" name="__module.model.layers.44.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7545"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10520" name="__module.model.layers.44.self_attn/aten::slice/Reshape_60" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10521" name="ShapeOf_301364" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10522" name="Constant_301365" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10523" name="Constant_301366" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="10524" name="Gather_301367" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10525" name="ShapeOf_301368" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10526" name="Constant_301369" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10527" name="Constant_301370" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="10528" name="Gather_301371" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10529" name="Add_301372" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="7546"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10530" name="__module.model.layers.44.self_attn/aten::slice/Reshape_62" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10531" name="__module.model.layers.44.self_attn/aten::slice/Reshape_63" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10532" name="__module.model.layers.44.self_attn/aten::slice/Slice_15" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="7550"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="10533" name="__module.model.layers.44.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="7551,attn_output.177"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10534" name="__module.model.layers.44.self_attn/aten::transpose/ScatterElementsUpdate_3" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10535" name="__module.model.layers.44.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7552"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10536" name="Constant_301966" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="798146608" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="10537" name="__module.model.layers.44.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7555"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10538" name="self.model.layers.44.self_attn.o_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="7092650104" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10539" name="Convert_386917" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10540" name="self.model.layers.44.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="7105757304" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10541" name="Convert_386919" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10542" name="self.model.layers.44.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10543" name="self.model.layers.44.self_attn.o_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="7105859704" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10544" name="self.model.layers.44.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10545" name="Constant_386924" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10546" name="Reshape_386925" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10547" name="__module.model.layers.44.self_attn.o_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10548" name="__module.model.layers.44.self_attn.o_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7557,7559,hidden_states.1337"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10549" name="__module.model.layers.44/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7562,7564,7575,hidden_states.1339,hidden_states.1341"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10550" name="Constant_290497" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="7106269304" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10551" name="Constant_290496" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10552" name="Constant_290494" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10553" name="__module.model.layers.44.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7565"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10554" name="Constant_30692" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="7566"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10555" name="__module.model.layers.44.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7567,variance.179"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10556" name="Constant_290495" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10557" name="__module.model.layers.44.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7568"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10558" name="__module.model.layers.44.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10559" name="__module.model.layers.44.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7569"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10560" name="__module.model.layers.44.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7570,7571,hidden_states.1343,hidden_states.1345"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10561" name="__module.model.layers.44.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7572,7574"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10562" name="self.model.layers.44.mlp.gate_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="7106289784" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10563" name="Convert_385917" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10564" name="self.model.layers.44.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="7141679224" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10565" name="Convert_385919" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10566" name="self.model.layers.44.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10567" name="self.model.layers.44.mlp.gate_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="7141955704" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10568" name="self.model.layers.44.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10569" name="Constant_385924" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10570" name="Reshape_385925" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10571" name="__module.model.layers.44.mlp.gate_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10572" name="__module.model.layers.44.mlp.gate_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7580,input.89"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="10573" name="__module.model.layers.44.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="7581"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="10574" name="self.model.layers.44.mlp.up_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="7143061624" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10575" name="Convert_385907" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10576" name="self.model.layers.44.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="7178451064" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10577" name="Convert_385909" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10578" name="self.model.layers.44.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10579" name="self.model.layers.44.mlp.up_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="7178727544" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10580" name="self.model.layers.44.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10581" name="Constant_385914" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10582" name="Reshape_385915" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10583" name="__module.model.layers.44.mlp.up_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10584" name="__module.model.layers.44.mlp.up_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7583"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="10585" name="__module.model.layers.44.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7584"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="10586" name="self.model.layers.44.mlp.down_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 128" offset="7179833464" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10587" name="Convert_385927" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10588" name="self.model.layers.44.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 1" offset="7215222904" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10589" name="Convert_385929" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10590" name="self.model.layers.44.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10591" name="self.model.layers.44.mlp.down_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 108, 1" offset="7215499384" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10592" name="self.model.layers.44.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10593" name="Constant_385934" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="922101848" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10594" name="Reshape_385935" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="10595" name="__module.model.layers.44.mlp.down_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="10596" name="__module.model.layers.44.mlp.down_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7586,hidden_states.1347"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10597" name="__module.model.layers.44/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7587,7589,7597,7608,hidden_states.1349,hidden_states.1351"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10598" name="Constant_290501" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="7216605304" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10599" name="Constant_290500" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10600" name="Constant_290498" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10601" name="__module.model.layers.45.input_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7598"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10602" name="Constant_30766" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="7599"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10603" name="__module.model.layers.45.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7600,variance.181"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10604" name="Constant_290499" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10605" name="__module.model.layers.45.input_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7601"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10606" name="__module.model.layers.45.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10607" name="__module.model.layers.45.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7602"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10608" name="__module.model.layers.45.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7603,7604,hidden_states.1353,hidden_states.1355"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10609" name="__module.model.layers.45.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7605,7607,hidden_states.1357"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10610" name="self.model.layers.45.self_attn.q_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="7216625784" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10611" name="Convert_386927" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10612" name="self.model.layers.45.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="7229732984" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10613" name="Convert_386929" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10614" name="self.model.layers.45.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10615" name="self.model.layers.45.self_attn.q_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="7229835384" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10616" name="self.model.layers.45.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10617" name="Constant_386934" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10618" name="Reshape_386935" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10619" name="__module.model.layers.45.self_attn.q_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10620" name="__module.model.layers.45.self_attn.q_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10621" name="self.model.layers.45.self_attn.q_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="5120" offset="7230244984" size="10240" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.45.self_attn.q_proj.bias"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10622" name="__module.model.layers.45.self_attn.q_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10623" name="__module.model.layers.45.self_attn.q_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7617,query_states.91"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10624" name="Constant_301967" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="792694336" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10625" name="__module.model.layers.45.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7625"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10626" name="__module.model.layers.45.self_attn/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10627" name="__module.model.layers.45.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7626,q.91"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10628" name="__module.model.layers.45.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7635"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10629" name="__module.model.layers.45.self_attn/aten::size/ShapeOf_3" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10630" name="__module.model.layers.45.self_attn/aten::size/Constant_3" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="10631" name="__module.model.layers.45.self_attn/aten::size/Gather_3" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="7636,7641" /> + </output> + </layer> + <layer id="10632" name="__module.model.layers.45.self_attn/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="10633" name="__module.model.layers.45.self_attn/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="7638,7639,7643,7644" /> + </output> + </layer> + <layer id="10634" name="Constant_221220" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10635" name="__module.model.layers.45.self_attn/aten::slice/Reshape_5" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10636" name="__module.model.layers.45.self_attn/aten::slice/Reshape_1" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10637" name="__module.model.layers.45.self_attn/aten::slice/Reshape_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10638" name="__module.model.layers.45.self_attn/aten::slice/Reshape_3" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10639" name="__module.model.layers.45.self_attn/aten::slice/Slice" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="7645,x2.181"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="10640" name="Constant_290502" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10641" name="__module.model.layers.45.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7646"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="10642" name="__module.model.layers.45.self_attn/aten::slice/Reshape_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10643" name="__module.model.layers.45.self_attn/aten::slice/Reshape_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10644" name="__module.model.layers.45.self_attn/aten::slice/Reshape_7" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10645" name="__module.model.layers.45.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="7640"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="10646" name="__module.model.layers.45.self_attn/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7648"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10647" name="__module.model.layers.45.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7649"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10648" name="__module.model.layers.45.self_attn/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7650"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10649" name="Constant_341945" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="10650" name="Constant_341938" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10651" name="Constant_341940" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10652" name="Constant_341942" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10653" name="Concat_341943" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10654" name="Broadcast_341946" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10655" name="ReadValue_333236" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.45.keypresent.45.key" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.45.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10656" name="Constant_325579" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="10657" name="Gather_325580" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10658" name="self.model.layers.45.self_attn.k_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="7230255224" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10659" name="Convert_387887" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10660" name="self.model.layers.45.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="7232876664" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10661" name="Convert_387889" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10662" name="self.model.layers.45.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10663" name="self.model.layers.45.self_attn.k_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="7232897144" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10664" name="self.model.layers.45.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10665" name="Constant_387894" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10666" name="Reshape_387895" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10667" name="__module.model.layers.45.self_attn.k_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10668" name="__module.model.layers.45.self_attn.k_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="10669" name="self.model.layers.45.self_attn.k_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="7232979064" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.45.self_attn.k_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="10670" name="__module.model.layers.45.self_attn.k_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="10671" name="__module.model.layers.45.self_attn.k_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7620,key_states.185"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="10672" name="Constant_301968" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10673" name="__module.model.layers.45.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7628"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10674" name="__module.model.layers.45.self_attn/aten::transpose/ScatterElementsUpdate_1" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10675" name="__module.model.layers.45.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7629,k.91"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10676" name="__module.model.layers.45.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7651"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10677" name="__module.model.layers.45.self_attn/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10678" name="__module.model.layers.45.self_attn/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="10679" name="__module.model.layers.45.self_attn/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="7652,7657" /> + </output> + </layer> + <layer id="10680" name="__module.model.layers.45.self_attn/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="10681" name="__module.model.layers.45.self_attn/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="7654,7655,7659,7660" /> + </output> + </layer> + <layer id="10682" name="Constant_221221" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10683" name="__module.model.layers.45.self_attn/aten::slice/Reshape_13" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10684" name="__module.model.layers.45.self_attn/aten::slice/Reshape_9" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10685" name="__module.model.layers.45.self_attn/aten::slice/Reshape_10" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10686" name="__module.model.layers.45.self_attn/aten::slice/Reshape_11" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10687" name="__module.model.layers.45.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="7661,x2.183"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="10688" name="Constant_290503" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10689" name="__module.model.layers.45.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7662"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="10690" name="__module.model.layers.45.self_attn/aten::slice/Reshape_12" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10691" name="__module.model.layers.45.self_attn/aten::slice/Reshape_14" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10692" name="__module.model.layers.45.self_attn/aten::slice/Reshape_15" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10693" name="__module.model.layers.45.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="7656"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="10694" name="__module.model.layers.45.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7664"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10695" name="__module.model.layers.45.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7665"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10696" name="__module.model.layers.45.self_attn/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7666"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10697" name="__module.model.layers.45.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.45.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10698" name="__module.model.layers.45.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="7678,7679,7680"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10699" name="__module.model.layers.45.self_attn/aten::size/ShapeOf_6" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10700" name="Constant_302589" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="938477672" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10701" name="Constant_302590" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="10702" name="Gather_302591" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10703" name="Constant_269454" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10704" name="Constant_277766" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10705" name="Constant_277767" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="10706" name="Gather_277768" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10707" name="__module.model.layers.45.self_attn/prim::ListConstruct/Concat_2" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="3" precision="I64" names="7681"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="10708" name="__module.model.layers.45.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7682,hidden_states.1361"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10709" name="Constant_301969" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10710" name="__module.model.layers.45.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7686,key_states.187"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10711" name="Constant_341958" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="10712" name="Constant_341951" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10713" name="Constant_341953" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10714" name="Constant_341955" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10715" name="Concat_341956" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10716" name="Broadcast_341959" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10717" name="ReadValue_333238" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.45.valuepresent.45.value" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.45.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10718" name="Constant_325582" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="10719" name="Gather_325583" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10720" name="self.model.layers.45.self_attn.v_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="7232981112" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10721" name="Convert_387897" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10722" name="self.model.layers.45.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="7235602552" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10723" name="Convert_387899" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10724" name="self.model.layers.45.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10725" name="self.model.layers.45.self_attn.v_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="7235623032" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10726" name="self.model.layers.45.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10727" name="Constant_387904" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10728" name="Reshape_387905" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10729" name="__module.model.layers.45.self_attn.v_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10730" name="__module.model.layers.45.self_attn.v_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="10731" name="self.model.layers.45.self_attn.v_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="7235704952" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.45.self_attn.v_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="10732" name="__module.model.layers.45.self_attn.v_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="10733" name="__module.model.layers.45.self_attn.v_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7623,value_states.91"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="10734" name="Constant_301970" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10735" name="__module.model.layers.45.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7631"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10736" name="__module.model.layers.45.self_attn/aten::transpose/ScatterElementsUpdate_2" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10737" name="__module.model.layers.45.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7632"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10738" name="__module.model.layers.45.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.45.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10739" name="__module.model.layers.45.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="7694,7695,7696"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10740" name="__module.model.layers.45.self_attn/aten::size/ShapeOf_10" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10741" name="Constant_302355" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10742" name="__module.model.layers.45.self_attn/aten::size/Constant_11" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="10743" name="__module.model.layers.45.self_attn/aten::size/Gather_11" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="7688"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10744" name="Constant_269472" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10745" name="Constant_277776" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10746" name="Constant_277777" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="10747" name="Gather_277778" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10748" name="__module.model.layers.45.self_attn/prim::ListConstruct/Concat_5" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="7697"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="10749" name="__module.model.layers.45.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7698,hidden_states.1365"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10750" name="Constant_301971" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10751" name="__module.model.layers.45.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7702"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10752" name="__module.model.layers.45.self_attn/aten::slice/Reshape_60" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10753" name="ShapeOf_301450" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10754" name="Constant_301451" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10755" name="Constant_301452" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="10756" name="Gather_301453" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10757" name="ShapeOf_301454" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10758" name="Constant_301455" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10759" name="Constant_301456" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="10760" name="Gather_301457" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10761" name="Add_301458" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="7703"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10762" name="__module.model.layers.45.self_attn/aten::slice/Reshape_62" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10763" name="__module.model.layers.45.self_attn/aten::slice/Reshape_63" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10764" name="__module.model.layers.45.self_attn/aten::slice/Slice_15" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="7707"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="10765" name="__module.model.layers.45.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="7708,attn_output.181"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10766" name="__module.model.layers.45.self_attn/aten::transpose/ScatterElementsUpdate_3" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10767" name="__module.model.layers.45.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7709"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10768" name="Constant_301972" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="798146608" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="10769" name="__module.model.layers.45.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7712"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10770" name="self.model.layers.45.self_attn.o_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="7235707000" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10771" name="Convert_386937" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10772" name="self.model.layers.45.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="7248814200" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10773" name="Convert_386939" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10774" name="self.model.layers.45.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10775" name="self.model.layers.45.self_attn.o_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="7248916600" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10776" name="self.model.layers.45.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10777" name="Constant_386944" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10778" name="Reshape_386945" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10779" name="__module.model.layers.45.self_attn.o_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10780" name="__module.model.layers.45.self_attn.o_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7714,7716,hidden_states.1367"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10781" name="__module.model.layers.45/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7719,7721,7732,hidden_states.1369,hidden_states.1371"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10782" name="Constant_290507" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="7249326200" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10783" name="Constant_290506" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10784" name="Constant_290504" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10785" name="__module.model.layers.45.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7722"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10786" name="Constant_31364" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="7723"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10787" name="__module.model.layers.45.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7724,variance.183"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10788" name="Constant_290505" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10789" name="__module.model.layers.45.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7725"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10790" name="__module.model.layers.45.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10791" name="__module.model.layers.45.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7726"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10792" name="__module.model.layers.45.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7727,7728,hidden_states.1373,hidden_states.1375"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10793" name="__module.model.layers.45.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7729,7731"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10794" name="self.model.layers.45.mlp.gate_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="7249346680" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10795" name="Convert_385947" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10796" name="self.model.layers.45.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="7284736120" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10797" name="Convert_385949" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10798" name="self.model.layers.45.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10799" name="self.model.layers.45.mlp.gate_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="7285012600" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10800" name="self.model.layers.45.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10801" name="Constant_385954" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10802" name="Reshape_385955" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10803" name="__module.model.layers.45.mlp.gate_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10804" name="__module.model.layers.45.mlp.gate_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7737,input.91"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="10805" name="__module.model.layers.45.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="7738"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="10806" name="self.model.layers.45.mlp.up_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="7286118520" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10807" name="Convert_385937" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10808" name="self.model.layers.45.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="7321507960" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10809" name="Convert_385939" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10810" name="self.model.layers.45.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10811" name="self.model.layers.45.mlp.up_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="7321784440" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10812" name="self.model.layers.45.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10813" name="Constant_385944" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10814" name="Reshape_385945" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10815" name="__module.model.layers.45.mlp.up_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10816" name="__module.model.layers.45.mlp.up_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7740"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="10817" name="__module.model.layers.45.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7741"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="10818" name="self.model.layers.45.mlp.down_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 128" offset="7322890360" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10819" name="Convert_385957" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10820" name="self.model.layers.45.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 1" offset="7358279800" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10821" name="Convert_385959" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10822" name="self.model.layers.45.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10823" name="self.model.layers.45.mlp.down_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 108, 1" offset="7358556280" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10824" name="self.model.layers.45.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10825" name="Constant_385964" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="922101848" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10826" name="Reshape_385965" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="10827" name="__module.model.layers.45.mlp.down_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="10828" name="__module.model.layers.45.mlp.down_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7743,hidden_states.1377"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10829" name="__module.model.layers.45/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7744,7746,7754,7765,hidden_states.1379,hidden_states.1381"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10830" name="Constant_290511" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="7359662200" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10831" name="Constant_290510" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10832" name="Constant_290508" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10833" name="__module.model.layers.46.input_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7755"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10834" name="Constant_31438" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="7756"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10835" name="__module.model.layers.46.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7757,variance.185"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10836" name="Constant_290509" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10837" name="__module.model.layers.46.input_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7758"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10838" name="__module.model.layers.46.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10839" name="__module.model.layers.46.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7759"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10840" name="__module.model.layers.46.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7760,7761,hidden_states.1383,hidden_states.1385"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10841" name="__module.model.layers.46.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7762,7764,hidden_states.1387"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10842" name="self.model.layers.46.self_attn.q_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="7359682680" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10843" name="Convert_386947" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10844" name="self.model.layers.46.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="7372789880" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10845" name="Convert_386949" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10846" name="self.model.layers.46.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10847" name="self.model.layers.46.self_attn.q_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="7372892280" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10848" name="self.model.layers.46.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10849" name="Constant_386954" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10850" name="Reshape_386955" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10851" name="__module.model.layers.46.self_attn.q_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10852" name="__module.model.layers.46.self_attn.q_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10853" name="self.model.layers.46.self_attn.q_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="5120" offset="7373301880" size="10240" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.46.self_attn.q_proj.bias"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10854" name="__module.model.layers.46.self_attn.q_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10855" name="__module.model.layers.46.self_attn.q_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7774,query_states.93"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10856" name="Constant_301973" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="792694336" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10857" name="__module.model.layers.46.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7782"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10858" name="__module.model.layers.46.self_attn/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10859" name="__module.model.layers.46.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7783,q.93"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10860" name="__module.model.layers.46.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7792"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10861" name="__module.model.layers.46.self_attn/aten::size/ShapeOf_3" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10862" name="__module.model.layers.46.self_attn/aten::size/Constant_3" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="10863" name="__module.model.layers.46.self_attn/aten::size/Gather_3" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="7793,7798" /> + </output> + </layer> + <layer id="10864" name="__module.model.layers.46.self_attn/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="10865" name="__module.model.layers.46.self_attn/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="7795,7796,7800,7801" /> + </output> + </layer> + <layer id="10866" name="Constant_221235" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10867" name="__module.model.layers.46.self_attn/aten::slice/Reshape_5" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10868" name="__module.model.layers.46.self_attn/aten::slice/Reshape_1" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10869" name="__module.model.layers.46.self_attn/aten::slice/Reshape_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10870" name="__module.model.layers.46.self_attn/aten::slice/Reshape_3" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10871" name="__module.model.layers.46.self_attn/aten::slice/Slice" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="7802,x2.185"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="10872" name="Constant_290512" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10873" name="__module.model.layers.46.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7803"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="10874" name="__module.model.layers.46.self_attn/aten::slice/Reshape_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10875" name="__module.model.layers.46.self_attn/aten::slice/Reshape_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10876" name="__module.model.layers.46.self_attn/aten::slice/Reshape_7" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10877" name="__module.model.layers.46.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="7797"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="10878" name="__module.model.layers.46.self_attn/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7805"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10879" name="__module.model.layers.46.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7806"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10880" name="__module.model.layers.46.self_attn/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7807"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10881" name="Constant_341971" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="10882" name="Constant_341964" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10883" name="Constant_341966" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10884" name="Constant_341968" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10885" name="Concat_341969" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10886" name="Broadcast_341972" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10887" name="ReadValue_333240" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.46.keypresent.46.key" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.46.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10888" name="Constant_325585" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="10889" name="Gather_325586" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10890" name="self.model.layers.46.self_attn.k_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="7373312120" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10891" name="Convert_387907" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10892" name="self.model.layers.46.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="7375933560" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10893" name="Convert_387909" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10894" name="self.model.layers.46.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10895" name="self.model.layers.46.self_attn.k_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="7375954040" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10896" name="self.model.layers.46.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10897" name="Constant_387914" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10898" name="Reshape_387915" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10899" name="__module.model.layers.46.self_attn.k_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10900" name="__module.model.layers.46.self_attn.k_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="10901" name="self.model.layers.46.self_attn.k_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="7376035960" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.46.self_attn.k_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="10902" name="__module.model.layers.46.self_attn.k_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="10903" name="__module.model.layers.46.self_attn.k_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7777,key_states.189"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="10904" name="Constant_301974" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10905" name="__module.model.layers.46.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7785"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10906" name="__module.model.layers.46.self_attn/aten::transpose/ScatterElementsUpdate_1" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10907" name="__module.model.layers.46.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7786,k.93"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10908" name="__module.model.layers.46.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7808"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10909" name="__module.model.layers.46.self_attn/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10910" name="__module.model.layers.46.self_attn/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="10911" name="__module.model.layers.46.self_attn/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="7809,7814" /> + </output> + </layer> + <layer id="10912" name="__module.model.layers.46.self_attn/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="10913" name="__module.model.layers.46.self_attn/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="7811,7812,7816,7817" /> + </output> + </layer> + <layer id="10914" name="Constant_221236" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10915" name="__module.model.layers.46.self_attn/aten::slice/Reshape_13" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10916" name="__module.model.layers.46.self_attn/aten::slice/Reshape_9" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10917" name="__module.model.layers.46.self_attn/aten::slice/Reshape_10" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10918" name="__module.model.layers.46.self_attn/aten::slice/Reshape_11" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10919" name="__module.model.layers.46.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="7818,x2.187"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="10920" name="Constant_290513" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10921" name="__module.model.layers.46.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7819"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="10922" name="__module.model.layers.46.self_attn/aten::slice/Reshape_12" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10923" name="__module.model.layers.46.self_attn/aten::slice/Reshape_14" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10924" name="__module.model.layers.46.self_attn/aten::slice/Reshape_15" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10925" name="__module.model.layers.46.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="7813"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="10926" name="__module.model.layers.46.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7821"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10927" name="__module.model.layers.46.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7822"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10928" name="__module.model.layers.46.self_attn/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7823"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10929" name="__module.model.layers.46.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.46.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10930" name="__module.model.layers.46.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="7835,7836,7837"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10931" name="__module.model.layers.46.self_attn/aten::size/ShapeOf_6" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10932" name="Constant_302594" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="938477672" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10933" name="Constant_302595" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="10934" name="Gather_302596" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10935" name="Constant_269490" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10936" name="Constant_277801" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10937" name="Constant_277802" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="10938" name="Gather_277803" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10939" name="__module.model.layers.46.self_attn/prim::ListConstruct/Concat_2" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="3" precision="I64" names="7838"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="10940" name="__module.model.layers.46.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7839,hidden_states.1391"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10941" name="Constant_301975" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10942" name="__module.model.layers.46.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7843,key_states.191"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10943" name="Constant_341984" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="10944" name="Constant_341977" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10945" name="Constant_341979" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10946" name="Constant_341981" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10947" name="Concat_341982" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10948" name="Broadcast_341985" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10949" name="ReadValue_333242" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.46.valuepresent.46.value" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.46.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10950" name="Constant_325588" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="10951" name="Gather_325589" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10952" name="self.model.layers.46.self_attn.v_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="7376038008" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10953" name="Convert_387917" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10954" name="self.model.layers.46.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="7378659448" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10955" name="Convert_387919" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10956" name="self.model.layers.46.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10957" name="self.model.layers.46.self_attn.v_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="7378679928" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10958" name="self.model.layers.46.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10959" name="Constant_387924" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10960" name="Reshape_387925" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10961" name="__module.model.layers.46.self_attn.v_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="10962" name="__module.model.layers.46.self_attn.v_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="10963" name="self.model.layers.46.self_attn.v_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="7378761848" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.46.self_attn.v_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="10964" name="__module.model.layers.46.self_attn.v_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="10965" name="__module.model.layers.46.self_attn.v_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7780,value_states.93"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="10966" name="Constant_301976" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10967" name="__module.model.layers.46.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7788"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10968" name="__module.model.layers.46.self_attn/aten::transpose/ScatterElementsUpdate_2" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10969" name="__module.model.layers.46.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7789"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10970" name="__module.model.layers.46.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.46.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10971" name="__module.model.layers.46.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="7851,7852,7853"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10972" name="__module.model.layers.46.self_attn/aten::size/ShapeOf_10" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10973" name="Constant_302361" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10974" name="__module.model.layers.46.self_attn/aten::size/Constant_11" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="10975" name="__module.model.layers.46.self_attn/aten::size/Gather_11" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="7845"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10976" name="Constant_269508" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10977" name="Constant_277811" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10978" name="Constant_277812" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="10979" name="Gather_277813" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="10980" name="__module.model.layers.46.self_attn/prim::ListConstruct/Concat_5" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="7854"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="10981" name="__module.model.layers.46.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7855,hidden_states.1395"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10982" name="Constant_301977" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10983" name="__module.model.layers.46.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7859"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10984" name="__module.model.layers.46.self_attn/aten::slice/Reshape_60" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10985" name="ShapeOf_301536" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10986" name="Constant_301537" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10987" name="Constant_301538" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="10988" name="Gather_301539" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10989" name="ShapeOf_301540" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10990" name="Constant_301541" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10991" name="Constant_301542" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="10992" name="Gather_301543" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10993" name="Add_301544" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="7860"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10994" name="__module.model.layers.46.self_attn/aten::slice/Reshape_62" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10995" name="__module.model.layers.46.self_attn/aten::slice/Reshape_63" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="10996" name="__module.model.layers.46.self_attn/aten::slice/Slice_15" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="7864"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="10997" name="__module.model.layers.46.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="7865,attn_output.185"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="10998" name="__module.model.layers.46.self_attn/aten::transpose/ScatterElementsUpdate_3" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="10999" name="__module.model.layers.46.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7866"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11000" name="Constant_301978" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="798146608" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="11001" name="__module.model.layers.46.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7869"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11002" name="self.model.layers.46.self_attn.o_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="7378763896" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11003" name="Convert_386957" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11004" name="self.model.layers.46.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="7391871096" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11005" name="Convert_386959" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11006" name="self.model.layers.46.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11007" name="self.model.layers.46.self_attn.o_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="7391973496" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11008" name="self.model.layers.46.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11009" name="Constant_386964" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="11010" name="Reshape_386965" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11011" name="__module.model.layers.46.self_attn.o_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11012" name="__module.model.layers.46.self_attn.o_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7871,7873,hidden_states.1397"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11013" name="__module.model.layers.46/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7876,7878,7889,hidden_states.1399,hidden_states.1401"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11014" name="Constant_290517" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="7392383096" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11015" name="Constant_290516" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11016" name="Constant_290514" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11017" name="__module.model.layers.46.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7879"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11018" name="Constant_32036" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="7880"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11019" name="__module.model.layers.46.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7881,variance.187"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11020" name="Constant_290515" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11021" name="__module.model.layers.46.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7882"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11022" name="__module.model.layers.46.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11023" name="__module.model.layers.46.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7883"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11024" name="__module.model.layers.46.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7884,7885,hidden_states.1403,hidden_states.1405"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11025" name="__module.model.layers.46.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7886,7888"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11026" name="self.model.layers.46.mlp.gate_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="7392403576" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11027" name="Convert_385977" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11028" name="self.model.layers.46.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="7427793016" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11029" name="Convert_385979" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11030" name="self.model.layers.46.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11031" name="self.model.layers.46.mlp.gate_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="7428069496" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11032" name="self.model.layers.46.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11033" name="Constant_385984" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="11034" name="Reshape_385985" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11035" name="__module.model.layers.46.mlp.gate_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11036" name="__module.model.layers.46.mlp.gate_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7894,input.93"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="11037" name="__module.model.layers.46.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="7895"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="11038" name="self.model.layers.46.mlp.up_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="7429175416" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11039" name="Convert_385967" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11040" name="self.model.layers.46.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="7464564856" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11041" name="Convert_385969" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11042" name="self.model.layers.46.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11043" name="self.model.layers.46.mlp.up_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="7464841336" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11044" name="self.model.layers.46.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11045" name="Constant_385974" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="11046" name="Reshape_385975" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11047" name="__module.model.layers.46.mlp.up_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11048" name="__module.model.layers.46.mlp.up_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7897"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="11049" name="__module.model.layers.46.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7898"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="11050" name="self.model.layers.46.mlp.down_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 128" offset="7465947256" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11051" name="Convert_385987" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11052" name="self.model.layers.46.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 1" offset="7501336696" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11053" name="Convert_385989" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11054" name="self.model.layers.46.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11055" name="self.model.layers.46.mlp.down_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 108, 1" offset="7501613176" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11056" name="self.model.layers.46.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11057" name="Constant_385994" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="922101848" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="11058" name="Reshape_385995" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="11059" name="__module.model.layers.46.mlp.down_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="11060" name="__module.model.layers.46.mlp.down_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7900,hidden_states.1407"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11061" name="__module.model.layers.46/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7901,7903,7911,7922,hidden_states.1409,hidden_states.1411"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11062" name="Constant_290520" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11063" name="Constant_290518" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11064" name="__module.model.layers.47.input_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7912"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11065" name="Constant_32110" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="7913"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11066" name="__module.model.layers.47.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7914,variance.189"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11067" name="Constant_290519" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11068" name="__module.model.layers.47.input_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7915"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11069" name="__module.model.layers.47.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11070" name="__module.model.layers.47.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7916"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11071" name="__module.model.layers.47.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7917,7918,hidden_states.1413,hidden_states.1415"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11072" name="__module.model.layers.47.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7919,7921,hidden_states.1417"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11073" name="self.model.layers.47.self_attn.v_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="7502719096" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11074" name="Convert_387927" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11075" name="self.model.layers.47.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="7505340536" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11076" name="Convert_387929" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11077" name="self.model.layers.47.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11078" name="self.model.layers.47.self_attn.v_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="7505361016" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11079" name="self.model.layers.47.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11080" name="Constant_387934" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="11081" name="Reshape_387935" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11082" name="__module.model.layers.47.self_attn.v_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11083" name="__module.model.layers.47.self_attn.v_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="11084" name="self.model.layers.47.self_attn.v_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="7505442936" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.47.self_attn.v_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="11085" name="__module.model.layers.47.self_attn.v_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="11086" name="__module.model.layers.47.self_attn.v_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7937,value_states"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="11087" name="Constant_301979" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="11088" name="__module.model.layers.47.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7945"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11089" name="__module.model.layers.47.self_attn/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="11090" name="__module.model.layers.47.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7946"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11091" name="__module.model.layers.47.self_attn/aten::cat/Concat" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.47.value"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11093" name="Constant_341997" type="Const" version="opset1"> + <data element_type="f32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="FP32" /> + </output> + </layer> + <layer id="11094" name="Constant_341990" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="12" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11095" name="Constant_341992" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11096" name="Constant_341994" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="20" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11097" name="Concat_341995" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="4" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="11098" name="Broadcast_341998" type="Broadcast" version="opset3"> + <data mode="numpy" /> + <input> + <port id="0" precision="FP32" /> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11099" name="ReadValue_333244" type="ReadValue" version="opset6"> + <data variable_id="past_key_values.47.keypresent.47.key" variable_type="f32" variable_shape="?,8,?,128" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>0</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="past_key_values.47.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11100" name="Constant_325591" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="11101" name="Gather_325592" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>-1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11102" name="self.model.layers.47.self_attn.k_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 128" offset="7505444984" size="2621440" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11103" name="Convert_387937" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11104" name="self.model.layers.47.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="1024, 40, 1" offset="7508066424" size="20480" /> + <output> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11105" name="Convert_387939" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11106" name="self.model.layers.47.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11107" name="self.model.layers.47.self_attn.k_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="1024, 40, 1" offset="7508086904" size="81920" /> + <output> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11108" name="self.model.layers.47.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11109" name="Constant_387944" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795418528" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="11110" name="Reshape_387945" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11111" name="__module.model.layers.47.self_attn.k_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11112" name="__module.model.layers.47.self_attn.k_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="11113" name="self.model.layers.47.self_attn.k_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="1024" offset="7508168824" size="2048" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.47.self_attn.k_proj.bias"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="11114" name="__module.model.layers.47.self_attn.k_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="11115" name="__module.model.layers.47.self_attn.k_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="FP32"> + <dim>1024</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7934,key_states.193"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + </output> + </layer> + <layer id="11116" name="Constant_301980" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420592" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="11117" name="__module.model.layers.47.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1024</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7942"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11118" name="__module.model.layers.47.self_attn/aten::transpose/ScatterElementsUpdate_1" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="11119" name="__module.model.layers.47.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>8</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7943,k"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11120" name="__module.model.layers.47.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7965"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11121" name="__module.model.layers.47.self_attn/aten::size/ShapeOf_3" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="11122" name="__module.model.layers.47.self_attn/aten::size/Constant_3" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="11123" name="__module.model.layers.47.self_attn/aten::size/Gather_3" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="7966,7971" /> + </output> + </layer> + <layer id="11124" name="__module.model.layers.47.self_attn/aten::floor_divide/Divide_1" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="11125" name="__module.model.layers.47.self_attn/aten::floor_divide/Floor_1" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="7968,7969,7973,7974" /> + </output> + </layer> + <layer id="11126" name="Constant_221250" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11127" name="__module.model.layers.47.self_attn/aten::slice/Reshape_5" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11128" name="__module.model.layers.47.self_attn/aten::slice/Reshape_1" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11129" name="__module.model.layers.47.self_attn/aten::slice/Reshape_2" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11130" name="__module.model.layers.47.self_attn/aten::slice/Reshape_3" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11131" name="__module.model.layers.47.self_attn/aten::slice/Slice" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="7975,x2"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="11132" name="Constant_290522" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11133" name="__module.model.layers.47.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7976"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="11134" name="__module.model.layers.47.self_attn/aten::slice/Reshape_4" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11135" name="__module.model.layers.47.self_attn/aten::slice/Reshape_6" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11136" name="__module.model.layers.47.self_attn/aten::slice/Reshape_7" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11137" name="__module.model.layers.47.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="7970"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="11138" name="__module.model.layers.47.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7978"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11139" name="__module.model.layers.47.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7979"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11140" name="__module.model.layers.47.self_attn/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7980"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11141" name="__module.model.layers.47.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> + <data axis="-2" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="present.47.key"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11227" name="Constant_290531" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="7508170872" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11228" name="self.model.layers.47.self_attn.q_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="7508191352" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11229" name="Convert_386967" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11230" name="self.model.layers.47.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="7521298552" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11231" name="Convert_386969" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11232" name="self.model.layers.47.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11233" name="self.model.layers.47.self_attn.q_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="7521400952" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11234" name="self.model.layers.47.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11235" name="Constant_386974" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="11236" name="Reshape_386975" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11237" name="__module.model.layers.47.self_attn.q_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11238" name="__module.model.layers.47.self_attn.q_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11239" name="self.model.layers.47.self_attn.q_proj.bias" type="Const" version="opset1"> + <data element_type="bf16" shape="5120" offset="7521810552" size="10240" /> + <output> + <port id="0" precision="BF16" names="self.model.layers.47.self_attn.q_proj.bias"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11240" name="__module.model.layers.47.self_attn.q_proj/prim::PythonOp/ConvertLike_1" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="BF16"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11241" name="__module.model.layers.47.self_attn.q_proj/prim::PythonOp/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7931,query_states"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11242" name="Constant_301981" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="792694336" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="11243" name="__module.model.layers.47.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7939"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11244" name="__module.model.layers.47.self_attn/aten::transpose/ScatterElementsUpdate_2" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="11245" name="__module.model.layers.47.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7940,q"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11246" name="__module.model.layers.47.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7949"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11247" name="__module.model.layers.47.self_attn/aten::size/ShapeOf_5" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="11248" name="__module.model.layers.47.self_attn/aten::size/Constant_5" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="11249" name="__module.model.layers.47.self_attn/aten::size/Gather_5" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64" /> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="7950,7955" /> + </output> + </layer> + <layer id="11250" name="__module.model.layers.47.self_attn/aten::floor_divide/Divide_3" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="I64" /> + </output> + </layer> + <layer id="11251" name="__module.model.layers.47.self_attn/aten::floor_divide/Floor_3" type="Floor" version="opset1"> + <input> + <port id="0" precision="I64" /> + </input> + <output> + <port id="1" precision="I64" names="7952,7953,7957,7958" /> + </output> + </layer> + <layer id="11252" name="Constant_221251" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11253" name="__module.model.layers.47.self_attn/aten::slice/Reshape_13" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="I64" /> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11254" name="__module.model.layers.47.self_attn/aten::slice/Reshape_9" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694676" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11255" name="__module.model.layers.47.self_attn/aten::slice/Reshape_10" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11256" name="__module.model.layers.47.self_attn/aten::slice/Reshape_11" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11257" name="__module.model.layers.47.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="7959,x2.189"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="11258" name="Constant_290523" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1, 1" offset="792694684" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11259" name="__module.model.layers.47.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7960"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="11260" name="__module.model.layers.47.self_attn/aten::slice/Reshape_12" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11261" name="__module.model.layers.47.self_attn/aten::slice/Reshape_14" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11262" name="__module.model.layers.47.self_attn/aten::slice/Reshape_15" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11263" name="__module.model.layers.47.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="7954"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </output> + </layer> + <layer id="11264" name="__module.model.layers.47.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> + <data axis="-1" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>64</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7962"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11265" name="__module.model.layers.47.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7963"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11266" name="__module.model.layers.47.self_attn/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7964"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11267" name="__module.model.layers.47.self_attn/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="7992,7993,7994"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11268" name="__module.model.layers.47.self_attn/aten::size/ShapeOf_6" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="11269" name="Constant_302599" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="938477672" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="11270" name="Constant_302600" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="11271" name="Gather_302601" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="11272" name="Constant_269526" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11273" name="Constant_277836" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="11274" name="Constant_277837" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="11275" name="Gather_277838" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="11276" name="__module.model.layers.47.self_attn/prim::ListConstruct/Concat_3" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="3" precision="I64" names="7995"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="11277" name="__module.model.layers.47.self_attn/aten::expand/Broadcast" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="7996,hidden_states.1421"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11278" name="Constant_301982" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="11279" name="__module.model.layers.47.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="8000,key_states"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11280" name="__module.model.layers.47.self_attn/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64" /> + </input> + <output> + <port id="2" precision="FP32" names="8008,8009,8010"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11281" name="__module.model.layers.47.self_attn/aten::size/ShapeOf_10" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="11282" name="Constant_302367" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11283" name="__module.model.layers.47.self_attn/aten::size/Constant_11" type="Const" version="opset1"> + <data element_type="i32" shape="" offset="0" size="4" /> + <output> + <port id="0" precision="I32" /> + </output> + </layer> + <layer id="11284" name="__module.model.layers.47.self_attn/aten::size/Gather_11" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I32" /> + </input> + <output> + <port id="3" precision="I64" names="8002"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11285" name="Constant_269544" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="795420624" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11286" name="Constant_277846" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="795420632" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="11287" name="Constant_277847" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="11288" name="Gather_277848" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="11289" name="__module.model.layers.47.self_attn/prim::ListConstruct/Concat_5" type="Concat" version="opset1"> + <data axis="0" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="4" precision="I64" names="8011"> + <dim>5</dim> + </port> + </output> + </layer> + <layer id="11290" name="__module.model.layers.47.self_attn/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> + <data mode="bidirectional" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>5</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="8012,hidden_states.1425"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11291" name="Constant_301983" type="Const" version="opset1"> + <data element_type="i64" shape="4" offset="795420648" size="32" /> + <output> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="11292" name="__module.model.layers.47.self_attn/aten::reshape/Reshape_1" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>5</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="8016"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11293" name="__module.model.layers.47.self_attn/aten::slice/Reshape_60" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="4" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11294" name="ShapeOf_301622" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="11295" name="Constant_301623" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11296" name="Constant_301624" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="11297" name="Gather_301625" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11298" name="ShapeOf_301626" type="ShapeOf" version="opset3"> + <data output_type="i64" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="I64"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="11299" name="Constant_301627" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694668" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11300" name="Constant_301628" type="Const" version="opset1"> + <data element_type="i64" shape="" offset="4" size="8" /> + <output> + <port id="0" precision="I64" /> + </output> + </layer> + <layer id="11301" name="Gather_301629" type="Gather" version="opset8"> + <data batch_dims="0" /> + <input> + <port id="0" precision="I64"> + <dim>4</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64" /> + </input> + <output> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11302" name="Add_301630" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="I64" names="8017"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11303" name="__module.model.layers.47.self_attn/aten::slice/Reshape_62" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694640" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11304" name="__module.model.layers.47.self_attn/aten::slice/Reshape_63" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="792694660" size="8" /> + <output> + <port id="0" precision="I64"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11305" name="__module.model.layers.47.self_attn/aten::slice/Slice_15" type="Slice" version="opset8"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + <port id="2" precision="I64"> + <dim>1</dim> + </port> + <port id="3" precision="I64"> + <dim>1</dim> + </port> + <port id="4" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="5" precision="FP32" names="8021"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </output> + </layer> + <layer id="11306" name="__module.model.layers.47.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> + <data causal="false" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="2" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="3" precision="FP32"> + <dim>-1</dim> + <dim>1</dim> + <dim>-1</dim> + <dim>-1</dim> + </port> + </input> + <output> + <port id="4" precision="FP32" names="8022,attn_output.189"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11307" name="__module.model.layers.47.self_attn/aten::transpose/ScatterElementsUpdate_3" type="Const" version="opset1"> + <data element_type="i32" shape="4" offset="792694368" size="16" /> + <output> + <port id="0" precision="I32"> + <dim>4</dim> + </port> + </output> + </layer> + <layer id="11308" name="__module.model.layers.47.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>40</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + <port id="1" precision="I32"> + <dim>4</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="8023"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11309" name="Constant_301984" type="Const" version="opset1"> + <data element_type="i64" shape="3" offset="798146608" size="24" /> + <output> + <port id="0" precision="I64"> + <dim>3</dim> + </port> + </output> + </layer> + <layer id="11310" name="__module.model.layers.47.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> + <data special_zero="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>3</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="8026"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11311" name="self.model.layers.47.self_attn.o_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 128" offset="7521820792" size="13107200" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11312" name="Convert_386977" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11313" name="self.model.layers.47.self_attn.o_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 40, 1" offset="7534927992" size="102400" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11314" name="Convert_386979" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11315" name="self.model.layers.47.self_attn.o_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11316" name="self.model.layers.47.self_attn.o_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 40, 1" offset="7535030392" size="409600" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11317" name="self.model.layers.47.self_attn.o_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11318" name="Constant_386984" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="792684080" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="11319" name="Reshape_386985" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11320" name="__module.model.layers.47.self_attn.o_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11321" name="__module.model.layers.47.self_attn.o_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="8028,8030,hidden_states.1427"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11322" name="__module.model.layers.47/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="8033,8035,8046,hidden_states.1429,hidden_states.1431"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11323" name="Constant_290527" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 5120" offset="7535439992" size="20480" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11324" name="Constant_290526" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11325" name="Constant_290524" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11326" name="__module.model.layers.47.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="8036"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11327" name="Constant_32708" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="8037"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11328" name="__module.model.layers.47.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="8038,variance.191"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11329" name="Constant_290525" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11330" name="__module.model.layers.47.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="8039"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11331" name="__module.model.layers.47.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11332" name="__module.model.layers.47.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="8040"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11333" name="__module.model.layers.47.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="8041,8042,hidden_states.1433,hidden_states.1435"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11334" name="__module.model.layers.47.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="8043,8045"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11335" name="self.model.layers.47.mlp.gate_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="7535460472" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11336" name="Convert_386007" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11337" name="self.model.layers.47.mlp.gate_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="7570849912" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11338" name="Convert_386009" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11339" name="self.model.layers.47.mlp.gate_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11340" name="self.model.layers.47.mlp.gate_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="7571126392" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11341" name="self.model.layers.47.mlp.gate_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11342" name="Constant_386014" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="11343" name="Reshape_386015" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11344" name="__module.model.layers.47.mlp.gate_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11345" name="__module.model.layers.47.mlp.gate_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="8051,input"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="11346" name="__module.model.layers.47.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32" names="8052"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="11347" name="self.model.layers.47.mlp.up_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 128" offset="7572232312" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11348" name="Convert_385997" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11349" name="self.model.layers.47.mlp.up_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="13824, 40, 1" offset="7607621752" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11350" name="Convert_385999" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11351" name="self.model.layers.47.mlp.up_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11352" name="self.model.layers.47.mlp.up_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="13824, 40, 1" offset="7607898232" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11353" name="self.model.layers.47.mlp.up_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11354" name="Constant_386004" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="848558152" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="11355" name="Reshape_386005" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>40</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11356" name="__module.model.layers.47.mlp.up_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11357" name="__module.model.layers.47.mlp.up_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>13824</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="8054"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="11358" name="__module.model.layers.47.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="8055"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="11359" name="self.model.layers.47.mlp.down_proj.weight" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 128" offset="7609004152" size="35389440" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11360" name="Convert_386017" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11361" name="self.model.layers.47.mlp.down_proj.weight/zero_point" type="Const" version="opset1"> + <data element_type="u4" shape="5120, 108, 1" offset="7644393592" size="276480" /> + <output> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11362" name="Convert_386019" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U4"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11363" name="self.model.layers.47.mlp.down_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11364" name="self.model.layers.47.mlp.down_proj.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="5120, 108, 1" offset="7644670072" size="1105920" /> + <output> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11365" name="self.model.layers.47.mlp.down_proj.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11366" name="Constant_386024" type="Const" version="opset1"> + <data element_type="i64" shape="2" offset="922101848" size="16" /> + <output> + <port id="0" precision="I64"> + <dim>2</dim> + </port> + </output> + </layer> + <layer id="11367" name="Reshape_386025" type="Reshape" version="opset1"> + <data special_zero="false" /> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>108</dim> + <dim>128</dim> + </port> + <port id="1" precision="I64"> + <dim>2</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="11368" name="__module.model.layers.47.mlp.down_proj/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </output> + </layer> + <layer id="11369" name="__module.model.layers.47.mlp.down_proj/prim::PythonOp/MatMul" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>13824</dim> + </port> + <port id="1" precision="FP32"> + <dim>5120</dim> + <dim>13824</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="8057,hidden_states.1437"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11370" name="__module.model.layers.47/aten::add/Add_1" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="8058,8060,8064,hidden_states.1439,hidden_states.1441"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11371" name="Constant_290530" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064860" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11372" name="Constant_290528" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064864" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11373" name="__module.model.norm/aten::pow/Power" type="Power" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="8065"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11374" name="Constant_32778" type="Const" version="opset1"> + <data element_type="i64" shape="1" offset="779064868" size="8" /> + <output> + <port id="0" precision="I64" names="8066"> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11375" name="__module.model.norm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> + <data keep_dims="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="I64"> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="8067,variance"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11376" name="Constant_290529" type="Const" version="opset1"> + <data element_type="f32" shape="1, 1, 1" offset="779064876" size="4" /> + <output> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11377" name="__module.model.norm/aten::add/Add" type="Add" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="8068"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11378" name="__module.model.norm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11379" name="__module.model.norm/aten::rsqrt/Divide" type="Divide" version="opset1"> + <data auto_broadcast="numpy" m_pythondiv="true" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>1</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="8069"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11380" name="__module.model.norm/aten::mul/Multiply" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="8070,8071,hidden_states.1443,hidden_states.1445"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11381" name="__module.model.norm/aten::mul/Multiply_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP32"> + <dim>1</dim> + <dim>1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="152,253,258,263,8072,hidden_states"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11382" name="self.lm_head.weight" type="Const" version="opset1"> + <data element_type="u8" shape="152064, 5120" offset="7645775992" size="778567680" /> + <output> + <port id="0" precision="U8"> + <dim>152064</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11383" name="Convert_384578" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>152064</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>152064</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11384" name="self.lm_head.weight/zero_point" type="Const" version="opset1"> + <data element_type="u8" shape="152064, 1" offset="8424343672" size="152064" /> + <output> + <port id="0" precision="U8"> + <dim>152064</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11385" name="Convert_384581" type="Convert" version="opset1"> + <data destination_type="f16" /> + <input> + <port id="0" precision="U8"> + <dim>152064</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="1" precision="FP16"> + <dim>152064</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11386" name="self.lm_head.weight/zero_point/subtract" type="Subtract" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>152064</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP16"> + <dim>152064</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>152064</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11387" name="self.lm_head.weight/scale" type="Const" version="opset1"> + <data element_type="f16" shape="152064, 1" offset="8424495736" size="304128" /> + <output> + <port id="0" precision="FP16"> + <dim>152064</dim> + <dim>1</dim> + </port> + </output> + </layer> + <layer id="11388" name="self.lm_head.weight/fq_weights_1" type="Multiply" version="opset1"> + <data auto_broadcast="numpy" /> + <input> + <port id="0" precision="FP16"> + <dim>152064</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP16"> + <dim>152064</dim> + <dim>1</dim> + </port> + </input> + <output> + <port id="2" precision="FP16"> + <dim>152064</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11389" name="__module.lm_head/prim::PythonOp/ConvertLike" type="Convert" version="opset1"> + <data destination_type="f32" /> + <rt_info> + <attribute name="decompression" version="0" /> + </rt_info> + <input> + <port id="0" precision="FP16"> + <dim>152064</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>152064</dim> + <dim>5120</dim> + </port> + </output> + </layer> + <layer id="11390" name="aten::to/Convert" type="MatMul" version="opset1"> + <data transpose_a="false" transpose_b="true" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>5120</dim> + </port> + <port id="1" precision="FP32"> + <dim>152064</dim> + <dim>5120</dim> + </port> + </input> + <output> + <port id="2" precision="FP32" names="logits"> + <dim>-1</dim> + <dim>-1</dim> + <dim>152064</dim> + </port> + </output> + </layer> + <layer id="11226" name="Assign_333077" type="Assign" version="opset6"> + <data variable_id="past_key_values.0.keypresent.0.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11225" name="Assign_333079" type="Assign" version="opset6"> + <data variable_id="past_key_values.0.valuepresent.0.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11224" name="Assign_333081" type="Assign" version="opset6"> + <data variable_id="past_key_values.1.keypresent.1.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11223" name="Assign_333083" type="Assign" version="opset6"> + <data variable_id="past_key_values.1.valuepresent.1.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11222" name="Assign_333085" type="Assign" version="opset6"> + <data variable_id="past_key_values.10.keypresent.10.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11221" name="Assign_333087" type="Assign" version="opset6"> + <data variable_id="past_key_values.10.valuepresent.10.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11220" name="Assign_333089" type="Assign" version="opset6"> + <data variable_id="past_key_values.11.keypresent.11.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11219" name="Assign_333091" type="Assign" version="opset6"> + <data variable_id="past_key_values.11.valuepresent.11.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11218" name="Assign_333093" type="Assign" version="opset6"> + <data variable_id="past_key_values.12.keypresent.12.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11217" name="Assign_333095" type="Assign" version="opset6"> + <data variable_id="past_key_values.12.valuepresent.12.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11216" name="Assign_333097" type="Assign" version="opset6"> + <data variable_id="past_key_values.13.keypresent.13.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11215" name="Assign_333099" type="Assign" version="opset6"> + <data variable_id="past_key_values.13.valuepresent.13.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11214" name="Assign_333101" type="Assign" version="opset6"> + <data variable_id="past_key_values.14.keypresent.14.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11213" name="Assign_333103" type="Assign" version="opset6"> + <data variable_id="past_key_values.14.valuepresent.14.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11212" name="Assign_333105" type="Assign" version="opset6"> + <data variable_id="past_key_values.15.keypresent.15.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11211" name="Assign_333107" type="Assign" version="opset6"> + <data variable_id="past_key_values.15.valuepresent.15.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11210" name="Assign_333109" type="Assign" version="opset6"> + <data variable_id="past_key_values.16.keypresent.16.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11209" name="Assign_333111" type="Assign" version="opset6"> + <data variable_id="past_key_values.16.valuepresent.16.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11208" name="Assign_333113" type="Assign" version="opset6"> + <data variable_id="past_key_values.17.keypresent.17.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11207" name="Assign_333115" type="Assign" version="opset6"> + <data variable_id="past_key_values.17.valuepresent.17.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11206" name="Assign_333117" type="Assign" version="opset6"> + <data variable_id="past_key_values.18.keypresent.18.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11205" name="Assign_333119" type="Assign" version="opset6"> + <data variable_id="past_key_values.18.valuepresent.18.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11204" name="Assign_333121" type="Assign" version="opset6"> + <data variable_id="past_key_values.19.keypresent.19.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11203" name="Assign_333123" type="Assign" version="opset6"> + <data variable_id="past_key_values.19.valuepresent.19.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11202" name="Assign_333125" type="Assign" version="opset6"> + <data variable_id="past_key_values.2.keypresent.2.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11201" name="Assign_333127" type="Assign" version="opset6"> + <data variable_id="past_key_values.2.valuepresent.2.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11200" name="Assign_333129" type="Assign" version="opset6"> + <data variable_id="past_key_values.20.keypresent.20.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11199" name="Assign_333131" type="Assign" version="opset6"> + <data variable_id="past_key_values.20.valuepresent.20.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11198" name="Assign_333133" type="Assign" version="opset6"> + <data variable_id="past_key_values.21.keypresent.21.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11197" name="Assign_333135" type="Assign" version="opset6"> + <data variable_id="past_key_values.21.valuepresent.21.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11196" name="Assign_333137" type="Assign" version="opset6"> + <data variable_id="past_key_values.22.keypresent.22.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11195" name="Assign_333139" type="Assign" version="opset6"> + <data variable_id="past_key_values.22.valuepresent.22.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11194" name="Assign_333141" type="Assign" version="opset6"> + <data variable_id="past_key_values.23.keypresent.23.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11193" name="Assign_333143" type="Assign" version="opset6"> + <data variable_id="past_key_values.23.valuepresent.23.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11192" name="Assign_333145" type="Assign" version="opset6"> + <data variable_id="past_key_values.24.keypresent.24.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11191" name="Assign_333147" type="Assign" version="opset6"> + <data variable_id="past_key_values.24.valuepresent.24.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11190" name="Assign_333149" type="Assign" version="opset6"> + <data variable_id="past_key_values.25.keypresent.25.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11189" name="Assign_333151" type="Assign" version="opset6"> + <data variable_id="past_key_values.25.valuepresent.25.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11188" name="Assign_333153" type="Assign" version="opset6"> + <data variable_id="past_key_values.26.keypresent.26.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11187" name="Assign_333155" type="Assign" version="opset6"> + <data variable_id="past_key_values.26.valuepresent.26.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11186" name="Assign_333157" type="Assign" version="opset6"> + <data variable_id="past_key_values.27.keypresent.27.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11185" name="Assign_333159" type="Assign" version="opset6"> + <data variable_id="past_key_values.27.valuepresent.27.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11184" name="Assign_333161" type="Assign" version="opset6"> + <data variable_id="past_key_values.28.keypresent.28.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11183" name="Assign_333163" type="Assign" version="opset6"> + <data variable_id="past_key_values.28.valuepresent.28.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11182" name="Assign_333165" type="Assign" version="opset6"> + <data variable_id="past_key_values.29.keypresent.29.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11181" name="Assign_333167" type="Assign" version="opset6"> + <data variable_id="past_key_values.29.valuepresent.29.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11180" name="Assign_333169" type="Assign" version="opset6"> + <data variable_id="past_key_values.3.keypresent.3.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11179" name="Assign_333171" type="Assign" version="opset6"> + <data variable_id="past_key_values.3.valuepresent.3.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11178" name="Assign_333173" type="Assign" version="opset6"> + <data variable_id="past_key_values.30.keypresent.30.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11177" name="Assign_333175" type="Assign" version="opset6"> + <data variable_id="past_key_values.30.valuepresent.30.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11176" name="Assign_333177" type="Assign" version="opset6"> + <data variable_id="past_key_values.31.keypresent.31.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11175" name="Assign_333179" type="Assign" version="opset6"> + <data variable_id="past_key_values.31.valuepresent.31.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11174" name="Assign_333181" type="Assign" version="opset6"> + <data variable_id="past_key_values.32.keypresent.32.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11173" name="Assign_333183" type="Assign" version="opset6"> + <data variable_id="past_key_values.32.valuepresent.32.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11172" name="Assign_333185" type="Assign" version="opset6"> + <data variable_id="past_key_values.33.keypresent.33.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11171" name="Assign_333187" type="Assign" version="opset6"> + <data variable_id="past_key_values.33.valuepresent.33.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11170" name="Assign_333189" type="Assign" version="opset6"> + <data variable_id="past_key_values.34.keypresent.34.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11169" name="Assign_333191" type="Assign" version="opset6"> + <data variable_id="past_key_values.34.valuepresent.34.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11168" name="Assign_333193" type="Assign" version="opset6"> + <data variable_id="past_key_values.35.keypresent.35.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11167" name="Assign_333195" type="Assign" version="opset6"> + <data variable_id="past_key_values.35.valuepresent.35.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11166" name="Assign_333197" type="Assign" version="opset6"> + <data variable_id="past_key_values.36.keypresent.36.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11165" name="Assign_333199" type="Assign" version="opset6"> + <data variable_id="past_key_values.36.valuepresent.36.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11164" name="Assign_333201" type="Assign" version="opset6"> + <data variable_id="past_key_values.37.keypresent.37.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11163" name="Assign_333203" type="Assign" version="opset6"> + <data variable_id="past_key_values.37.valuepresent.37.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11162" name="Assign_333205" type="Assign" version="opset6"> + <data variable_id="past_key_values.38.keypresent.38.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11161" name="Assign_333207" type="Assign" version="opset6"> + <data variable_id="past_key_values.38.valuepresent.38.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11160" name="Assign_333209" type="Assign" version="opset6"> + <data variable_id="past_key_values.39.keypresent.39.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11159" name="Assign_333211" type="Assign" version="opset6"> + <data variable_id="past_key_values.39.valuepresent.39.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11158" name="Assign_333213" type="Assign" version="opset6"> + <data variable_id="past_key_values.4.keypresent.4.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11157" name="Assign_333215" type="Assign" version="opset6"> + <data variable_id="past_key_values.4.valuepresent.4.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11156" name="Assign_333217" type="Assign" version="opset6"> + <data variable_id="past_key_values.40.keypresent.40.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11155" name="Assign_333219" type="Assign" version="opset6"> + <data variable_id="past_key_values.40.valuepresent.40.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11154" name="Assign_333221" type="Assign" version="opset6"> + <data variable_id="past_key_values.41.keypresent.41.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11153" name="Assign_333223" type="Assign" version="opset6"> + <data variable_id="past_key_values.41.valuepresent.41.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11152" name="Assign_333225" type="Assign" version="opset6"> + <data variable_id="past_key_values.42.keypresent.42.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11151" name="Assign_333227" type="Assign" version="opset6"> + <data variable_id="past_key_values.42.valuepresent.42.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11150" name="Assign_333229" type="Assign" version="opset6"> + <data variable_id="past_key_values.43.keypresent.43.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11149" name="Assign_333231" type="Assign" version="opset6"> + <data variable_id="past_key_values.43.valuepresent.43.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11148" name="Assign_333233" type="Assign" version="opset6"> + <data variable_id="past_key_values.44.keypresent.44.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11147" name="Assign_333235" type="Assign" version="opset6"> + <data variable_id="past_key_values.44.valuepresent.44.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11146" name="Assign_333237" type="Assign" version="opset6"> + <data variable_id="past_key_values.45.keypresent.45.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11145" name="Assign_333239" type="Assign" version="opset6"> + <data variable_id="past_key_values.45.valuepresent.45.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11144" name="Assign_333241" type="Assign" version="opset6"> + <data variable_id="past_key_values.46.keypresent.46.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11143" name="Assign_333243" type="Assign" version="opset6"> + <data variable_id="past_key_values.46.valuepresent.46.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11142" name="Assign_333245" type="Assign" version="opset6"> + <data variable_id="past_key_values.47.keypresent.47.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11092" name="Assign_333247" type="Assign" version="opset6"> + <data variable_id="past_key_values.47.valuepresent.47.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2324" name="Assign_333249" type="Assign" version="opset6"> + <data variable_id="past_key_values.5.keypresent.5.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2323" name="Assign_333251" type="Assign" version="opset6"> + <data variable_id="past_key_values.5.valuepresent.5.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2322" name="Assign_333253" type="Assign" version="opset6"> + <data variable_id="past_key_values.6.keypresent.6.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2321" name="Assign_333255" type="Assign" version="opset6"> + <data variable_id="past_key_values.6.valuepresent.6.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2320" name="Assign_333257" type="Assign" version="opset6"> + <data variable_id="past_key_values.7.keypresent.7.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2319" name="Assign_333259" type="Assign" version="opset6"> + <data variable_id="past_key_values.7.valuepresent.7.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2318" name="Assign_333261" type="Assign" version="opset6"> + <data variable_id="past_key_values.8.keypresent.8.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2317" name="Assign_333263" type="Assign" version="opset6"> + <data variable_id="past_key_values.8.valuepresent.8.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2316" name="Assign_333265" type="Assign" version="opset6"> + <data variable_id="past_key_values.9.keypresent.9.key" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="2266" name="Assign_333267" type="Assign" version="opset6"> + <data variable_id="past_key_values.9.valuepresent.9.value" /> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </input> + <output> + <port id="1" precision="FP32"> + <dim>-1</dim> + <dim>8</dim> + <dim>-1</dim> + <dim>128</dim> + </port> + </output> + </layer> + <layer id="11391" name="Result_122122" type="Result" version="opset1"> + <input> + <port id="0" precision="FP32"> + <dim>-1</dim> + <dim>-1</dim> + <dim>152064</dim> + </port> + </input> + </layer> + </layers> + <edges> + <edge from-layer="0" from-port="0" to-layer="3295" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="2537" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="6775" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="2599" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="6945" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="2769" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="2831" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="7007" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="3001" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="3063" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="7177" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="3233" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="7239" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="501" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="7409" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="3465" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="3527" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="7471" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="177" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="3697" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="7641" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="3759" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="439" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="7703" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="3929" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="3991" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="2063" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="1429" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="6079" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="1599" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="1367" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="6249" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="1661" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="1197" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="110" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="1831" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="6311" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="1135" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="1893" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="7873" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="965" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="6481" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="2125" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="6543" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="903" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="2275" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="2333" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="733" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="6017" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="6713" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="671" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="9559" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="9033" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="7935" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="9095" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="5615" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="9265" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="11101" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="10951" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="9327" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="5847" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="10889" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="9497" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="10719" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="5553" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="10657" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="16" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="9729" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="10487" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="10425" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="9791" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="5785" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="10255" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="9961" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="10193" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="10023" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="8863" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="4161" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="4223" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="8105" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="4393" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="8167" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="4455" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="8337" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="4625" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="8399" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="4687" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="4857" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="8569" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="4919" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="5383" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="8631" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="5321" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="5089" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="8801" to-port="1" /> + <edge from-layer="0" from-port="0" to-layer="5151" to-port="1" /> + <edge from-layer="1" from-port="0" to-layer="69" to-port="0" /> + <edge from-layer="1" from-port="0" to-layer="60" to-port="0" /> + <edge from-layer="2" from-port="0" to-layer="290" to-port="0" /> + <edge from-layer="2" from-port="0" to-layer="222" to-port="0" /> + <edge from-layer="3" from-port="0" to-layer="5" to-port="0" /> + <edge from-layer="3" from-port="0" to-layer="26" to-port="0" /> + <edge from-layer="4" from-port="0" to-layer="13" to-port="0" /> + <edge from-layer="5" from-port="1" to-layer="8" to-port="0" /> + <edge from-layer="6" from-port="0" to-layer="8" to-port="1" /> + <edge from-layer="7" from-port="0" to-layer="8" to-port="2" /> + <edge from-layer="8" from-port="3" to-layer="4451" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="7869" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="3987" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="4157" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="7931" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="4219" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="8101" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="4389" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="8163" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="3925" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="8333" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="4621" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="4683" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="8395" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="4853" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="8565" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="435" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="8627" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="7699" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="3755" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="7637" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="3693" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="7467" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="3523" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="173" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="7405" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="3461" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="7235" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="3291" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="3229" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="7173" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="3059" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="10885" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="10019" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="10189" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="10251" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="12" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="9957" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="10421" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="9787" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="5781" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="10483" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="9725" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="10653" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="9555" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="10715" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="9493" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="5843" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="4915" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="9323" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="10947" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="11097" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="9261" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="9091" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="5611" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="5549" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="9029" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="5379" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="8859" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="5317" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="8797" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="5147" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="5085" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="1425" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="729" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="2271" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="899" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="6941" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="2329" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="2765" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="1363" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="106" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="6245" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="1595" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="1193" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="2595" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="6709" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="1657" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="2533" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="497" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="667" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="6013" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="6771" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="2827" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="2059" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="6307" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="6477" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="7003" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="1131" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="961" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="2121" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="1827" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="6075" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="2997" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="6539" to-port="0" /> + <edge from-layer="8" from-port="3" to-layer="1889" to-port="0" /> + <edge from-layer="9" from-port="0" to-layer="12" to-port="1" /> + <edge from-layer="10" from-port="0" to-layer="12" to-port="2" /> + <edge from-layer="11" from-port="0" to-layer="12" to-port="3" /> + <edge from-layer="12" from-port="4" to-layer="13" to-port="1" /> + <edge from-layer="13" from-port="2" to-layer="14" to-port="0" /> + <edge from-layer="14" from-port="1" to-layer="16" to-port="0" /> + <edge from-layer="15" from-port="0" to-layer="16" to-port="2" /> + <edge from-layer="16" from-port="3" to-layer="2265" to-port="0" /> + <edge from-layer="17" from-port="0" to-layer="2246" to-port="0" /> + <edge from-layer="18" from-port="0" to-layer="19" to-port="0" /> + <edge from-layer="19" from-port="1" to-layer="22" to-port="0" /> + <edge from-layer="20" from-port="0" to-layer="21" to-port="0" /> + <edge from-layer="21" from-port="1" to-layer="22" to-port="1" /> + <edge from-layer="22" from-port="2" to-layer="24" to-port="0" /> + <edge from-layer="23" from-port="0" to-layer="24" to-port="1" /> + <edge from-layer="24" from-port="2" to-layer="25" to-port="0" /> + <edge from-layer="25" from-port="1" to-layer="28" to-port="0" /> + <edge from-layer="26" from-port="1" to-layer="28" to-port="1" /> + <edge from-layer="27" from-port="0" to-layer="28" to-port="2" /> + <edge from-layer="28" from-port="3" to-layer="39" to-port="0" /> + <edge from-layer="28" from-port="3" to-layer="32" to-port="0" /> + <edge from-layer="28" from-port="3" to-layer="331" to-port="0" /> + <edge from-layer="29" from-port="0" to-layer="40" to-port="0" /> + <edge from-layer="30" from-port="0" to-layer="38" to-port="0" /> + <edge from-layer="31" from-port="0" to-layer="32" to-port="1" /> + <edge from-layer="32" from-port="2" to-layer="34" to-port="0" /> + <edge from-layer="33" from-port="0" to-layer="34" to-port="1" /> + <edge from-layer="34" from-port="2" to-layer="36" to-port="0" /> + <edge from-layer="35" from-port="0" to-layer="36" to-port="1" /> + <edge from-layer="36" from-port="2" to-layer="37" to-port="0" /> + <edge from-layer="37" from-port="1" to-layer="38" to-port="1" /> + <edge from-layer="38" from-port="2" to-layer="39" to-port="1" /> + <edge from-layer="39" from-port="2" to-layer="40" to-port="1" /> + <edge from-layer="40" from-port="2" to-layer="51" to-port="0" /> + <edge from-layer="40" from-port="2" to-layer="198" to-port="0" /> + <edge from-layer="40" from-port="2" to-layer="188" to-port="0" /> + <edge from-layer="40" from-port="2" to-layer="121" to-port="0" /> + <edge from-layer="41" from-port="0" to-layer="42" to-port="0" /> + <edge from-layer="42" from-port="1" to-layer="45" to-port="0" /> + <edge from-layer="43" from-port="0" to-layer="44" to-port="0" /> + <edge from-layer="44" from-port="1" to-layer="45" to-port="1" /> + <edge from-layer="45" from-port="2" to-layer="47" to-port="0" /> + <edge from-layer="46" from-port="0" to-layer="47" to-port="1" /> + <edge from-layer="47" from-port="2" to-layer="49" to-port="0" /> + <edge from-layer="48" from-port="0" to-layer="49" to-port="1" /> + <edge from-layer="49" from-port="2" to-layer="50" to-port="0" /> + <edge from-layer="50" from-port="1" to-layer="51" to-port="1" /> + <edge from-layer="51" from-port="2" to-layer="54" to-port="0" /> + <edge from-layer="52" from-port="0" to-layer="53" to-port="0" /> + <edge from-layer="53" from-port="1" to-layer="54" to-port="1" /> + <edge from-layer="54" from-port="2" to-layer="56" to-port="0" /> + <edge from-layer="55" from-port="0" to-layer="56" to-port="1" /> + <edge from-layer="56" from-port="2" to-layer="58" to-port="0" /> + <edge from-layer="57" from-port="0" to-layer="58" to-port="1" /> + <edge from-layer="58" from-port="2" to-layer="96" to-port="0" /> + <edge from-layer="58" from-port="2" to-layer="78" to-port="0" /> + <edge from-layer="58" from-port="2" to-layer="77" to-port="0" /> + <edge from-layer="58" from-port="2" to-layer="90" to-port="0" /> + <edge from-layer="59" from-port="0" to-layer="67" to-port="0" /> + <edge from-layer="60" from-port="1" to-layer="63" to-port="0" /> + <edge from-layer="61" from-port="0" to-layer="63" to-port="1" /> + <edge from-layer="62" from-port="0" to-layer="63" to-port="2" /> + <edge from-layer="63" from-port="3" to-layer="66" to-port="0" /> + <edge from-layer="64" from-port="0" to-layer="66" to-port="1" /> + <edge from-layer="65" from-port="0" to-layer="66" to-port="2" /> + <edge from-layer="66" from-port="3" to-layer="67" to-port="1" /> + <edge from-layer="67" from-port="2" to-layer="71" to-port="0" /> + <edge from-layer="68" from-port="0" to-layer="69" to-port="1" /> + <edge from-layer="68" from-port="0" to-layer="290" to-port="1" /> + <edge from-layer="68" from-port="0" to-layer="266" to-port="1" /> + <edge from-layer="68" from-port="0" to-layer="99" to-port="1" /> + <edge from-layer="68" from-port="0" to-layer="76" to-port="1" /> + <edge from-layer="69" from-port="2" to-layer="70" to-port="0" /> + <edge from-layer="70" from-port="1" to-layer="71" to-port="1" /> + <edge from-layer="71" from-port="2" to-layer="73" to-port="0" /> + <edge from-layer="72" from-port="0" to-layer="73" to-port="1" /> + <edge from-layer="73" from-port="2" to-layer="74" to-port="0" /> + <edge from-layer="73" from-port="2" to-layer="74" to-port="1" /> + <edge from-layer="74" from-port="2" to-layer="98" to-port="0" /> + <edge from-layer="74" from-port="2" to-layer="75" to-port="0" /> + <edge from-layer="75" from-port="1" to-layer="76" to-port="0" /> + <edge from-layer="76" from-port="2" to-layer="1618" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="10396" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="1850" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="642" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="1386" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="5804" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="10444" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="10860" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="5756" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="10212" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="10164" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="1338" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="1802" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="1570" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="10628" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="10676" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="2740" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="410" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="4412" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="4364" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="690" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="4180" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="4132" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="2556" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="3948" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="3900" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="3716" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="2508" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="3668" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="3484" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="2788" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="458" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="3436" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="3252" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="3204" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="2972" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="3020" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="5108" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="1154" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="2034" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="11120" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="11246" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="5572" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="1106" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="2082" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="5524" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="5340" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="5292" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="10908" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="5060" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="4876" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="922" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="4828" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="2294" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="4644" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="874" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="2353" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="4596" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="7892" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="8356" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="6916" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="7844" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="9748" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="6964" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="8308" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="9004" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="7428" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="7148" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="9700" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="6220" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="9468" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="8124" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="5988" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="6268" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="7196" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="9516" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="8076" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="9052" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="7380" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="9980" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="7660" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="6500" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="8772" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="129" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="6684" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="8588" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="6452" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="9284" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="9236" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="8540" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="6036" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="7612" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="8820" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="77" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="9932" to-port="1" /> + <edge from-layer="76" from-port="2" to-layer="6732" to-port="1" /> + <edge from-layer="77" from-port="2" to-layer="101" to-port="0" /> + <edge from-layer="78" from-port="1" to-layer="81" to-port="0" /> + <edge from-layer="79" from-port="0" to-layer="3951" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="3903" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="7895" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="7847" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="4135" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="413" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="7663" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="1341" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="5807" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="1157" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="4879" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="4831" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="8543" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="4647" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="8359" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="4599" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="1389" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="8311" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="4415" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="8591" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="8127" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="4367" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="4183" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="8079" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="6039" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="2975" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="2791" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="6967" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="2743" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="6919" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="1853" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="2559" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="6735" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="2511" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="1805" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="2356" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="6687" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="2297" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="132" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="2037" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="6503" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="2085" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="6455" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="3439" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="3719" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="7615" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="3671" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="6223" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="3487" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="7431" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="1621" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="461" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="1573" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="7383" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="3255" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="7199" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="3207" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="6271" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="3023" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="7151" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="5991" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="5575" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="10631" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="1109" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="5343" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="645" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="9703" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="9007" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="10679" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="5527" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="5759" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="9055" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="9519" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="5063" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="10863" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="9983" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="10215" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="877" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="9239" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="925" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="11249" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="9471" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="10911" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="11123" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="9287" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="8775" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="10447" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="5111" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="9751" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="693" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="9935" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="5295" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="81" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="10399" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="8823" to-port="1" /> + <edge from-layer="79" from-port="0" to-layer="10167" to-port="1" /> + <edge from-layer="80" from-port="0" to-layer="81" to-port="2" /> + <edge from-layer="81" from-port="3" to-layer="83" to-port="0" /> + <edge from-layer="82" from-port="0" to-layer="1854" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="9472" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="6736" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="1622" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="6688" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="3256" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="2560" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="462" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="878" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="133" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="3440" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="2512" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="7384" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="6224" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="10912" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="646" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="9752" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="3488" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="10400" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="9288" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="6920" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="6272" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="10632" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="2792" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="9936" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="6968" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="1806" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="5992" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="2976" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="9704" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="2744" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="694" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="10864" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="10680" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="3024" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="83" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="7152" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="5760" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="9520" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="3208" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="2357" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="6040" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="10448" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="7200" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="8312" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="5808" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="8080" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="6504" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="9008" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="4368" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="414" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="8776" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="8128" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="5344" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="10168" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="4416" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="1342" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="8824" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="4184" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="1110" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="5296" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="4600" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="2038" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="8360" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="2086" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="4648" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="1158" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="8544" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="5112" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="4832" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="6456" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="10216" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="7432" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="3672" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="2298" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="11124" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="7616" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="1574" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="8592" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="3720" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="9240" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="11250" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="7664" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="3904" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="926" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="7848" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="5576" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="3952" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="9984" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="9056" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="7896" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="4136" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="1390" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="5064" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="5528" to-port="1" /> + <edge from-layer="82" from-port="0" to-layer="4880" to-port="1" /> + <edge from-layer="83" from-port="2" to-layer="84" to-port="0" /> + <edge from-layer="84" from-port="1" to-layer="86" to-port="0" /> + <edge from-layer="85" from-port="0" to-layer="86" to-port="1" /> + <edge from-layer="86" from-port="2" to-layer="96" to-port="2" /> + <edge from-layer="86" from-port="2" to-layer="90" to-port="1" /> + <edge from-layer="87" from-port="0" to-layer="90" to-port="2" /> + <edge from-layer="88" from-port="0" to-layer="90" to-port="3" /> + <edge from-layer="89" from-port="0" to-layer="90" to-port="4" /> + <edge from-layer="90" from-port="5" to-layer="92" to-port="0" /> + <edge from-layer="91" from-port="0" to-layer="92" to-port="1" /> + <edge from-layer="92" from-port="2" to-layer="97" to-port="0" /> + <edge from-layer="93" from-port="0" to-layer="96" to-port="1" /> + <edge from-layer="94" from-port="0" to-layer="96" to-port="3" /> + <edge from-layer="95" from-port="0" to-layer="96" to-port="4" /> + <edge from-layer="96" from-port="5" to-layer="97" to-port="1" /> + <edge from-layer="97" from-port="2" to-layer="100" to-port="0" /> + <edge from-layer="98" from-port="1" to-layer="99" to-port="0" /> + <edge from-layer="99" from-port="2" to-layer="6055" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="1869" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="1173" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="2053" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="1125" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="1357" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="1405" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="941" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="1589" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="893" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="661" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="1637" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="6239" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="1821" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="709" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="6287" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="5127" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="11265" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="9071" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="5591" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="5543" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="9023" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="5359" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="8839" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="5311" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="8791" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="11139" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="5079" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="8607" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="4895" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="8559" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="4847" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="8375" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="4663" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="4615" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="9719" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="9999" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="10183" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="10231" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="9951" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="10415" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="9767" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="10463" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="5775" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="5823" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="8327" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="10647" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="10695" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="9535" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="9487" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="10879" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="10927" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="9303" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="9255" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="2575" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="3271" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="3223" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="7167" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="3039" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="2991" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="6983" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="2807" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="6935" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="2759" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="7215" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="6007" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="6751" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="2527" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="6703" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="2372" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="2313" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="6519" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="2101" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="3919" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="4431" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="8143" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="4383" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="8095" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="4199" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="7911" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="4151" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="3967" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="7863" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="6471" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="7679" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="3735" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="7631" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="3687" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="7447" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="3503" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="7399" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="3455" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="429" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="100" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="148" to-port="1" /> + <edge from-layer="99" from-port="2" to-layer="477" to-port="1" /> + <edge from-layer="100" from-port="2" to-layer="101" to-port="1" /> + <edge from-layer="101" from-port="2" to-layer="315" to-port="0" /> + <edge from-layer="102" from-port="0" to-layer="107" to-port="0" /> + <edge from-layer="103" from-port="0" to-layer="106" to-port="1" /> + <edge from-layer="104" from-port="0" to-layer="106" to-port="2" /> + <edge from-layer="105" from-port="0" to-layer="106" to-port="3" /> + <edge from-layer="106" from-port="4" to-layer="107" to-port="1" /> + <edge from-layer="107" from-port="2" to-layer="108" to-port="0" /> + <edge from-layer="108" from-port="1" to-layer="110" to-port="0" /> + <edge from-layer="109" from-port="0" to-layer="110" to-port="2" /> + <edge from-layer="110" from-port="3" to-layer="153" to-port="0" /> + <edge from-layer="110" from-port="3" to-layer="150" to-port="0" /> + <edge from-layer="111" from-port="0" to-layer="112" to-port="0" /> + <edge from-layer="112" from-port="1" to-layer="115" to-port="0" /> + <edge from-layer="113" from-port="0" to-layer="114" to-port="0" /> + <edge from-layer="114" from-port="1" to-layer="115" to-port="1" /> + <edge from-layer="115" from-port="2" to-layer="117" to-port="0" /> + <edge from-layer="116" from-port="0" to-layer="117" to-port="1" /> + <edge from-layer="117" from-port="2" to-layer="119" to-port="0" /> + <edge from-layer="118" from-port="0" to-layer="119" to-port="1" /> + <edge from-layer="119" from-port="2" to-layer="120" to-port="0" /> + <edge from-layer="120" from-port="1" to-layer="121" to-port="1" /> + <edge from-layer="121" from-port="2" to-layer="124" to-port="0" /> + <edge from-layer="122" from-port="0" to-layer="123" to-port="0" /> + <edge from-layer="123" from-port="1" to-layer="124" to-port="1" /> + <edge from-layer="124" from-port="2" to-layer="126" to-port="0" /> + <edge from-layer="125" from-port="0" to-layer="126" to-port="1" /> + <edge from-layer="126" from-port="2" to-layer="128" to-port="0" /> + <edge from-layer="127" from-port="0" to-layer="128" to-port="1" /> + <edge from-layer="128" from-port="2" to-layer="146" to-port="0" /> + <edge from-layer="128" from-port="2" to-layer="140" to-port="0" /> + <edge from-layer="128" from-port="2" to-layer="130" to-port="0" /> + <edge from-layer="128" from-port="2" to-layer="129" to-port="0" /> + <edge from-layer="129" from-port="2" to-layer="149" to-port="0" /> + <edge from-layer="130" from-port="1" to-layer="132" to-port="0" /> + <edge from-layer="131" from-port="0" to-layer="132" to-port="2" /> + <edge from-layer="132" from-port="3" to-layer="133" to-port="0" /> + <edge from-layer="133" from-port="2" to-layer="134" to-port="0" /> + <edge from-layer="134" from-port="1" to-layer="136" to-port="0" /> + <edge from-layer="135" from-port="0" to-layer="136" to-port="1" /> + <edge from-layer="136" from-port="2" to-layer="140" to-port="1" /> + <edge from-layer="136" from-port="2" to-layer="146" to-port="2" /> + <edge from-layer="137" from-port="0" to-layer="140" to-port="2" /> + <edge from-layer="138" from-port="0" to-layer="140" to-port="3" /> + <edge from-layer="139" from-port="0" to-layer="140" to-port="4" /> + <edge from-layer="140" from-port="5" to-layer="142" to-port="0" /> + <edge from-layer="141" from-port="0" to-layer="142" to-port="1" /> + <edge from-layer="142" from-port="2" to-layer="147" to-port="0" /> + <edge from-layer="143" from-port="0" to-layer="146" to-port="1" /> + <edge from-layer="144" from-port="0" to-layer="146" to-port="3" /> + <edge from-layer="145" from-port="0" to-layer="146" to-port="4" /> + <edge from-layer="146" from-port="5" to-layer="147" to-port="1" /> + <edge from-layer="147" from-port="2" to-layer="148" to-port="0" /> + <edge from-layer="148" from-port="2" to-layer="149" to-port="1" /> + <edge from-layer="149" from-port="2" to-layer="150" to-port="1" /> + <edge from-layer="149" from-port="2" to-layer="307" to-port="0" /> + <edge from-layer="150" from-port="2" to-layer="152" to-port="0" /> + <edge from-layer="150" from-port="2" to-layer="157" to-port="0" /> + <edge from-layer="150" from-port="2" to-layer="11226" to-port="0" /> + <edge from-layer="151" from-port="0" to-layer="10739" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="5635" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="712" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="9811" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="944" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="11280" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="11267" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="10971" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="10930" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="10234" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="10698" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="10507" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="291" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="10002" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="10043" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="10466" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="10275" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="8651" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="6058" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="197" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="7914" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="7955" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="8146" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="8187" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="8378" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="8419" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="753" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="8610" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="9770" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="8842" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="8883" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="5867" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="9074" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="9115" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="9306" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="9347" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="9538" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="9579" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="5826" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="2104" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="3083" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="3042" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="2851" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="480" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="2810" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="2619" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="2578" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="2387" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="2374" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="2145" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="3274" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="1176" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="521" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="1913" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="1872" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="1681" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="1640" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="1449" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="1217" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="1408" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="4434" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="5403" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="5362" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="5171" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="5130" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="985" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="4939" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="4898" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="4707" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="4666" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="4475" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="5594" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="4243" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="4202" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="4011" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="3970" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="3779" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="3738" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="3547" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="3506" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="3315" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="7682" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="6986" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="6795" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="6754" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="7027" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="152" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="7450" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="6563" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="6099" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="6522" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="7491" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="7218" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="6290" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="6331" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="7259" to-port="1" /> + <edge from-layer="151" from-port="0" to-layer="7723" to-port="1" /> + <edge from-layer="152" from-port="2" to-layer="166" to-port="0" /> + <edge from-layer="153" from-port="1" to-layer="255" to-port="0" /> + <edge from-layer="153" from-port="1" to-layer="156" to-port="0" /> + <edge from-layer="154" from-port="0" to-layer="156" to-port="1" /> + <edge from-layer="155" from-port="0" to-layer="156" to-port="2" /> + <edge from-layer="156" from-port="3" to-layer="165" to-port="0" /> + <edge from-layer="157" from-port="1" to-layer="160" to-port="0" /> + <edge from-layer="157" from-port="1" to-layer="164" to-port="0" /> + <edge from-layer="158" from-port="0" to-layer="160" to-port="1" /> + <edge from-layer="159" from-port="0" to-layer="160" to-port="2" /> + <edge from-layer="160" from-port="3" to-layer="165" to-port="1" /> + <edge from-layer="161" from-port="0" to-layer="165" to-port="2" /> + <edge from-layer="162" from-port="0" to-layer="164" to-port="1" /> + <edge from-layer="163" from-port="0" to-layer="164" to-port="2" /> + <edge from-layer="164" from-port="3" to-layer="165" to-port="3" /> + <edge from-layer="165" from-port="4" to-layer="166" to-port="1" /> + <edge from-layer="166" from-port="2" to-layer="168" to-port="0" /> + <edge from-layer="167" from-port="0" to-layer="168" to-port="1" /> + <edge from-layer="168" from-port="2" to-layer="315" to-port="1" /> + <edge from-layer="169" from-port="0" to-layer="174" to-port="0" /> + <edge from-layer="170" from-port="0" to-layer="173" to-port="1" /> + <edge from-layer="171" from-port="0" to-layer="173" to-port="2" /> + <edge from-layer="172" from-port="0" to-layer="173" to-port="3" /> + <edge from-layer="173" from-port="4" to-layer="174" to-port="1" /> + <edge from-layer="174" from-port="2" to-layer="175" to-port="0" /> + <edge from-layer="175" from-port="1" to-layer="177" to-port="0" /> + <edge from-layer="176" from-port="0" to-layer="177" to-port="2" /> + <edge from-layer="177" from-port="3" to-layer="196" to-port="0" /> + <edge from-layer="178" from-port="0" to-layer="179" to-port="0" /> + <edge from-layer="179" from-port="1" to-layer="182" to-port="0" /> + <edge from-layer="180" from-port="0" to-layer="181" to-port="0" /> + <edge from-layer="181" from-port="1" to-layer="182" to-port="1" /> + <edge from-layer="182" from-port="2" to-layer="184" to-port="0" /> + <edge from-layer="183" from-port="0" to-layer="184" to-port="1" /> + <edge from-layer="184" from-port="2" to-layer="186" to-port="0" /> + <edge from-layer="185" from-port="0" to-layer="186" to-port="1" /> + <edge from-layer="186" from-port="2" to-layer="187" to-port="0" /> + <edge from-layer="187" from-port="1" to-layer="188" to-port="1" /> + <edge from-layer="188" from-port="2" to-layer="191" to-port="0" /> + <edge from-layer="189" from-port="0" to-layer="190" to-port="0" /> + <edge from-layer="190" from-port="1" to-layer="191" to-port="1" /> + <edge from-layer="191" from-port="2" to-layer="193" to-port="0" /> + <edge from-layer="192" from-port="0" to-layer="193" to-port="1" /> + <edge from-layer="193" from-port="2" to-layer="195" to-port="0" /> + <edge from-layer="194" from-port="0" to-layer="195" to-port="1" /> + <edge from-layer="195" from-port="2" to-layer="196" to-port="1" /> + <edge from-layer="196" from-port="2" to-layer="11225" to-port="0" /> + <edge from-layer="196" from-port="2" to-layer="197" to-port="0" /> + <edge from-layer="196" from-port="2" to-layer="202" to-port="0" /> + <edge from-layer="197" from-port="2" to-layer="211" to-port="0" /> + <edge from-layer="198" from-port="1" to-layer="219" to-port="0" /> + <edge from-layer="198" from-port="1" to-layer="201" to-port="0" /> + <edge from-layer="199" from-port="0" to-layer="201" to-port="1" /> + <edge from-layer="200" from-port="0" to-layer="201" to-port="2" /> + <edge from-layer="201" from-port="3" to-layer="2396" to-port="0" /> + <edge from-layer="201" from-port="3" to-layer="7732" to-port="0" /> + <edge from-layer="201" from-port="3" to-layer="6804" to-port="0" /> + <edge from-layer="201" from-port="3" to-layer="7268" to-port="0" /> + <edge from-layer="201" from-port="3" to-layer="2860" to-port="0" /> + <edge from-layer="201" from-port="3" to-layer="2628" to-port="0" /> + <edge from-layer="201" from-port="3" to-layer="11289" to-port="0" /> + <edge from-layer="201" from-port="3" to-layer="6572" to-port="0" /> + <edge from-layer="201" from-port="3" to-layer="5644" to-port="0" /> + <edge from-layer="201" from-port="3" to-layer="10284" to-port="0" /> + <edge from-layer="201" from-port="3" to-layer="2154" to-port="0" /> + <edge from-layer="201" from-port="3" to-layer="10052" to-port="0" /> + <edge from-layer="201" from-port="3" to-layer="6340" to-port="0" /> + <edge from-layer="201" from-port="3" to-layer="7500" to-port="0" /> + <edge from-layer="201" from-port="3" to-layer="9588" to-port="0" /> + <edge from-layer="201" from-port="3" to-layer="8428" to-port="0" /> + <edge from-layer="201" from-port="3" to-layer="270" to-port="0" /> + <edge from-layer="201" from-port="3" to-layer="1922" to-port="0" /> + <edge from-layer="201" from-port="3" to-layer="9356" to-port="0" /> + <edge from-layer="201" from-port="3" to-layer="6108" to-port="0" /> + <edge from-layer="201" from-port="3" to-layer="994" to-port="0" /> + <edge from-layer="201" from-port="3" to-layer="4948" to-port="0" /> + <edge from-layer="201" from-port="3" to-layer="1226" to-port="0" /> + <edge from-layer="201" from-port="3" to-layer="7964" to-port="0" /> + <edge from-layer="201" from-port="3" to-layer="4716" to-port="0" /> + <edge from-layer="201" from-port="3" to-layer="4484" to-port="0" /> + <edge from-layer="201" from-port="3" to-layer="10980" to-port="0" /> + <edge from-layer="201" from-port="3" to-layer="4252" to-port="0" /> + <edge from-layer="201" from-port="3" to-layer="10748" to-port="0" /> + <edge from-layer="201" from-port="3" to-layer="210" to-port="0" /> + <edge from-layer="201" from-port="3" to-layer="4020" to-port="0" /> + <edge from-layer="201" from-port="3" to-layer="3092" to-port="0" /> + <edge from-layer="201" from-port="3" to-layer="5180" to-port="0" /> + <edge from-layer="201" from-port="3" to-layer="3788" to-port="0" /> + <edge from-layer="201" from-port="3" to-layer="1458" to-port="0" /> + <edge from-layer="201" from-port="3" to-layer="3556" to-port="0" /> + <edge from-layer="201" from-port="3" to-layer="7036" to-port="0" /> + <edge from-layer="201" from-port="3" to-layer="10516" to-port="0" /> + <edge from-layer="201" from-port="3" to-layer="3324" to-port="0" /> + <edge from-layer="201" from-port="3" to-layer="9820" to-port="0" /> + <edge from-layer="201" from-port="3" to-layer="8196" to-port="0" /> + <edge from-layer="201" from-port="3" to-layer="5412" to-port="0" /> + <edge from-layer="201" from-port="3" to-layer="9124" to-port="0" /> + <edge from-layer="201" from-port="3" to-layer="762" to-port="0" /> + <edge from-layer="201" from-port="3" to-layer="1690" to-port="0" /> + <edge from-layer="201" from-port="3" to-layer="5876" to-port="0" /> + <edge from-layer="201" from-port="3" to-layer="530" to-port="0" /> + <edge from-layer="201" from-port="3" to-layer="8892" to-port="0" /> + <edge from-layer="201" from-port="3" to-layer="8660" to-port="0" /> + <edge from-layer="202" from-port="1" to-layer="209" to-port="0" /> + <edge from-layer="202" from-port="1" to-layer="205" to-port="0" /> + <edge from-layer="203" from-port="0" to-layer="205" to-port="1" /> + <edge from-layer="204" from-port="0" to-layer="205" to-port="2" /> + <edge from-layer="205" from-port="3" to-layer="210" to-port="1" /> + <edge from-layer="206" from-port="0" to-layer="210" to-port="2" /> + <edge from-layer="207" from-port="0" to-layer="209" to-port="1" /> + <edge from-layer="208" from-port="0" to-layer="209" to-port="2" /> + <edge from-layer="209" from-port="3" to-layer="210" to-port="3" /> + <edge from-layer="210" from-port="4" to-layer="211" to-port="1" /> + <edge from-layer="211" from-port="2" to-layer="213" to-port="0" /> + <edge from-layer="212" from-port="0" to-layer="213" to-port="1" /> + <edge from-layer="213" from-port="2" to-layer="315" to-port="2" /> + <edge from-layer="214" from-port="0" to-layer="236" to-port="0" /> + <edge from-layer="214" from-port="0" to-layer="237" to-port="1" /> + <edge from-layer="215" from-port="0" to-layer="230" to-port="0" /> + <edge from-layer="216" from-port="0" to-layer="229" to-port="0" /> + <edge from-layer="217" from-port="0" to-layer="219" to-port="1" /> + <edge from-layer="218" from-port="0" to-layer="219" to-port="2" /> + <edge from-layer="219" from-port="3" to-layer="256" to-port="1" /> + <edge from-layer="219" from-port="3" to-layer="221" to-port="0" /> + <edge from-layer="220" from-port="0" to-layer="221" to-port="1" /> + <edge from-layer="221" from-port="2" to-layer="228" to-port="0" /> + <edge from-layer="222" from-port="1" to-layer="225" to-port="0" /> + <edge from-layer="223" from-port="0" to-layer="225" to-port="1" /> + <edge from-layer="224" from-port="0" to-layer="225" to-port="2" /> + <edge from-layer="225" from-port="3" to-layer="227" to-port="0" /> + <edge from-layer="225" from-port="3" to-layer="250" to-port="1" /> + <edge from-layer="226" from-port="0" to-layer="227" to-port="1" /> + <edge from-layer="227" from-port="2" to-layer="289" to-port="2" /> + <edge from-layer="227" from-port="2" to-layer="283" to-port="2" /> + <edge from-layer="227" from-port="2" to-layer="228" to-port="1" /> + <edge from-layer="228" from-port="2" to-layer="229" to-port="1" /> + <edge from-layer="229" from-port="2" to-layer="230" to-port="1" /> + <edge from-layer="230" from-port="2" to-layer="231" to-port="0" /> + <edge from-layer="230" from-port="2" to-layer="247" to-port="1" /> + <edge from-layer="231" from-port="1" to-layer="234" to-port="0" /> + <edge from-layer="231" from-port="1" to-layer="241" to-port="0" /> + <edge from-layer="232" from-port="0" to-layer="234" to-port="1" /> + <edge from-layer="233" from-port="0" to-layer="234" to-port="2" /> + <edge from-layer="234" from-port="3" to-layer="236" to-port="1" /> + <edge from-layer="235" from-port="0" to-layer="244" to-port="1" /> + <edge from-layer="235" from-port="0" to-layer="243" to-port="2" /> + <edge from-layer="235" from-port="0" to-layer="236" to-port="2" /> + <edge from-layer="236" from-port="3" to-layer="237" to-port="0" /> + <edge from-layer="237" from-port="2" to-layer="245" to-port="0" /> + <edge from-layer="238" from-port="0" to-layer="243" to-port="0" /> + <edge from-layer="238" from-port="0" to-layer="242" to-port="1" /> + <edge from-layer="239" from-port="0" to-layer="241" to-port="1" /> + <edge from-layer="240" from-port="0" to-layer="241" to-port="2" /> + <edge from-layer="241" from-port="3" to-layer="242" to-port="0" /> + <edge from-layer="242" from-port="2" to-layer="243" to-port="1" /> + <edge from-layer="243" from-port="3" to-layer="244" to-port="0" /> + <edge from-layer="244" from-port="2" to-layer="245" to-port="1" /> + <edge from-layer="245" from-port="2" to-layer="247" to-port="0" /> + <edge from-layer="246" from-port="0" to-layer="247" to-port="2" /> + <edge from-layer="247" from-port="3" to-layer="263" to-port="0" /> + <edge from-layer="248" from-port="0" to-layer="250" to-port="0" /> + <edge from-layer="249" from-port="0" to-layer="250" to-port="2" /> + <edge from-layer="250" from-port="3" to-layer="251" to-port="0" /> + <edge from-layer="251" from-port="1" to-layer="252" to-port="0" /> + <edge from-layer="252" from-port="1" to-layer="261" to-port="0" /> + <edge from-layer="253" from-port="0" to-layer="255" to-port="1" /> + <edge from-layer="254" from-port="0" to-layer="255" to-port="2" /> + <edge from-layer="255" from-port="3" to-layer="258" to-port="0" /> + <edge from-layer="255" from-port="3" to-layer="256" to-port="0" /> + <edge from-layer="255" from-port="3" to-layer="306" to-port="0" /> + <edge from-layer="256" from-port="2" to-layer="258" to-port="1" /> + <edge from-layer="257" from-port="0" to-layer="258" to-port="2" /> + <edge from-layer="258" from-port="3" to-layer="260" to-port="0" /> + <edge from-layer="259" from-port="0" to-layer="260" to-port="1" /> + <edge from-layer="260" from-port="2" to-layer="261" to-port="1" /> + <edge from-layer="261" from-port="2" to-layer="262" to-port="0" /> + <edge from-layer="262" from-port="1" to-layer="263" to-port="1" /> + <edge from-layer="263" from-port="2" to-layer="265" to-port="0" /> + <edge from-layer="264" from-port="0" to-layer="265" to-port="1" /> + <edge from-layer="265" from-port="2" to-layer="266" to-port="0" /> + <edge from-layer="266" from-port="2" to-layer="271" to-port="0" /> + <edge from-layer="267" from-port="0" to-layer="270" to-port="1" /> + <edge from-layer="268" from-port="0" to-layer="270" to-port="2" /> + <edge from-layer="269" from-port="0" to-layer="270" to-port="3" /> + <edge from-layer="270" from-port="4" to-layer="271" to-port="1" /> + <edge from-layer="271" from-port="2" to-layer="273" to-port="0" /> + <edge from-layer="271" from-port="2" to-layer="289" to-port="0" /> + <edge from-layer="271" from-port="2" to-layer="275" to-port="0" /> + <edge from-layer="272" from-port="0" to-layer="273" to-port="1" /> + <edge from-layer="273" from-port="2" to-layer="302" to-port="0" /> + <edge from-layer="274" from-port="0" to-layer="276" to-port="1" /> + <edge from-layer="274" from-port="0" to-layer="278" to-port="0" /> + <edge from-layer="275" from-port="1" to-layer="276" to-port="0" /> + <edge from-layer="275" from-port="1" to-layer="279" to-port="1" /> + <edge from-layer="275" from-port="1" to-layer="303" to-port="1" /> + <edge from-layer="276" from-port="2" to-layer="278" to-port="1" /> + <edge from-layer="277" from-port="0" to-layer="278" to-port="2" /> + <edge from-layer="278" from-port="3" to-layer="279" to-port="0" /> + <edge from-layer="279" from-port="2" to-layer="283" to-port="0" /> + <edge from-layer="280" from-port="0" to-layer="283" to-port="1" /> + <edge from-layer="281" from-port="0" to-layer="283" to-port="3" /> + <edge from-layer="282" from-port="0" to-layer="283" to-port="4" /> + <edge from-layer="283" from-port="5" to-layer="285" to-port="0" /> + <edge from-layer="284" from-port="0" to-layer="285" to-port="1" /> + <edge from-layer="285" from-port="2" to-layer="302" to-port="1" /> + <edge from-layer="286" from-port="0" to-layer="289" to-port="1" /> + <edge from-layer="287" from-port="0" to-layer="289" to-port="3" /> + <edge from-layer="288" from-port="0" to-layer="289" to-port="4" /> + <edge from-layer="289" from-port="5" to-layer="298" to-port="0" /> + <edge from-layer="289" from-port="5" to-layer="297" to-port="2" /> + <edge from-layer="289" from-port="5" to-layer="293" to-port="0" /> + <edge from-layer="290" from-port="2" to-layer="291" to-port="0" /> + <edge from-layer="291" from-port="2" to-layer="292" to-port="0" /> + <edge from-layer="292" from-port="1" to-layer="293" to-port="1" /> + <edge from-layer="293" from-port="2" to-layer="295" to-port="0" /> + <edge from-layer="294" from-port="0" to-layer="295" to-port="1" /> + <edge from-layer="295" from-port="2" to-layer="297" to-port="0" /> + <edge from-layer="296" from-port="0" to-layer="297" to-port="1" /> + <edge from-layer="297" from-port="3" to-layer="299" to-port="0" /> + <edge from-layer="298" from-port="1" to-layer="299" to-port="1" /> + <edge from-layer="299" from-port="2" to-layer="301" to-port="0" /> + <edge from-layer="300" from-port="0" to-layer="301" to-port="1" /> + <edge from-layer="301" from-port="2" to-layer="302" to-port="2" /> + <edge from-layer="302" from-port="3" to-layer="303" to-port="0" /> + <edge from-layer="303" from-port="2" to-layer="7284" to-port="0" /> + <edge from-layer="303" from-port="2" to-layer="5428" to-port="0" /> + <edge from-layer="303" from-port="2" to-layer="11305" to-port="0" /> + <edge from-layer="303" from-port="2" to-layer="5196" to-port="0" /> + <edge from-layer="303" from-port="2" to-layer="5660" to-port="0" /> + <edge from-layer="303" from-port="2" to-layer="1242" to-port="0" /> + <edge from-layer="303" from-port="2" to-layer="6820" to-port="0" /> + <edge from-layer="303" from-port="2" to-layer="6124" to-port="0" /> + <edge from-layer="303" from-port="2" to-layer="1706" to-port="0" /> + <edge from-layer="303" from-port="2" to-layer="546" to-port="0" /> + <edge from-layer="303" from-port="2" to-layer="1938" to-port="0" /> + <edge from-layer="303" from-port="2" to-layer="6356" to-port="0" /> + <edge from-layer="303" from-port="2" to-layer="2170" to-port="0" /> + <edge from-layer="303" from-port="2" to-layer="2412" to-port="0" /> + <edge from-layer="303" from-port="2" to-layer="6588" to-port="0" /> + <edge from-layer="303" from-port="2" to-layer="2644" to-port="0" /> + <edge from-layer="303" from-port="2" to-layer="2876" to-port="0" /> + <edge from-layer="303" from-port="2" to-layer="3108" to-port="0" /> + <edge from-layer="303" from-port="2" to-layer="4964" to-port="0" /> + <edge from-layer="303" from-port="2" to-layer="1474" to-port="0" /> + <edge from-layer="303" from-port="2" to-layer="3340" to-port="0" /> + <edge from-layer="303" from-port="2" to-layer="3572" to-port="0" /> + <edge from-layer="303" from-port="2" to-layer="3804" to-port="0" /> + <edge from-layer="303" from-port="2" to-layer="7052" to-port="0" /> + <edge from-layer="303" from-port="2" to-layer="4036" to-port="0" /> + <edge from-layer="303" from-port="2" to-layer="4268" to-port="0" /> + <edge from-layer="303" from-port="2" to-layer="4500" to-port="0" /> + <edge from-layer="303" from-port="2" to-layer="1010" to-port="0" /> + <edge from-layer="303" from-port="2" to-layer="4732" to-port="0" /> + <edge from-layer="303" from-port="2" to-layer="7748" to-port="0" /> + <edge from-layer="303" from-port="2" to-layer="314" to-port="0" /> + <edge from-layer="303" from-port="2" to-layer="10300" to-port="0" /> + <edge from-layer="303" from-port="2" to-layer="10068" to-port="0" /> + <edge from-layer="303" from-port="2" to-layer="9836" to-port="0" /> + <edge from-layer="303" from-port="2" to-layer="7516" to-port="0" /> + <edge from-layer="303" from-port="2" to-layer="9604" to-port="0" /> + <edge from-layer="303" from-port="2" to-layer="9372" to-port="0" /> + <edge from-layer="303" from-port="2" to-layer="9140" to-port="0" /> + <edge from-layer="303" from-port="2" to-layer="10532" to-port="0" /> + <edge from-layer="303" from-port="2" to-layer="778" to-port="0" /> + <edge from-layer="303" from-port="2" to-layer="8676" to-port="0" /> + <edge from-layer="303" from-port="2" to-layer="5892" to-port="0" /> + <edge from-layer="303" from-port="2" to-layer="8444" to-port="0" /> + <edge from-layer="303" from-port="2" to-layer="10996" to-port="0" /> + <edge from-layer="303" from-port="2" to-layer="10764" to-port="0" /> + <edge from-layer="303" from-port="2" to-layer="8212" to-port="0" /> + <edge from-layer="303" from-port="2" to-layer="7980" to-port="0" /> + <edge from-layer="303" from-port="2" to-layer="8908" to-port="0" /> + <edge from-layer="304" from-port="0" to-layer="314" to-port="1" /> + <edge from-layer="305" from-port="0" to-layer="306" to-port="1" /> + <edge from-layer="306" from-port="2" to-layer="311" to-port="0" /> + <edge from-layer="307" from-port="1" to-layer="310" to-port="0" /> + <edge from-layer="308" from-port="0" to-layer="310" to-port="1" /> + <edge from-layer="309" from-port="0" to-layer="310" to-port="2" /> + <edge from-layer="310" from-port="3" to-layer="311" to-port="1" /> + <edge from-layer="311" from-port="2" to-layer="314" to-port="2" /> + <edge from-layer="312" from-port="0" to-layer="314" to-port="3" /> + <edge from-layer="313" from-port="0" to-layer="314" to-port="4" /> + <edge from-layer="314" from-port="5" to-layer="315" to-port="3" /> + <edge from-layer="315" from-port="4" to-layer="317" to-port="0" /> + <edge from-layer="316" from-port="0" to-layer="317" to-port="1" /> + <edge from-layer="317" from-port="2" to-layer="319" to-port="0" /> + <edge from-layer="318" from-port="0" to-layer="319" to-port="1" /> + <edge from-layer="319" from-port="2" to-layer="330" to-port="0" /> + <edge from-layer="320" from-port="0" to-layer="321" to-port="0" /> + <edge from-layer="321" from-port="1" to-layer="324" to-port="0" /> + <edge from-layer="322" from-port="0" to-layer="323" to-port="0" /> + <edge from-layer="323" from-port="1" to-layer="324" to-port="1" /> + <edge from-layer="324" from-port="2" to-layer="326" to-port="0" /> + <edge from-layer="325" from-port="0" to-layer="326" to-port="1" /> + <edge from-layer="326" from-port="2" to-layer="328" to-port="0" /> + <edge from-layer="327" from-port="0" to-layer="328" to-port="1" /> + <edge from-layer="328" from-port="2" to-layer="329" to-port="0" /> + <edge from-layer="329" from-port="1" to-layer="330" to-port="1" /> + <edge from-layer="330" from-port="2" to-layer="331" to-port="1" /> + <edge from-layer="331" from-port="2" to-layer="342" to-port="0" /> + <edge from-layer="331" from-port="2" to-layer="335" to-port="0" /> + <edge from-layer="331" from-port="2" to-layer="379" to-port="0" /> + <edge from-layer="332" from-port="0" to-layer="343" to-port="0" /> + <edge from-layer="333" from-port="0" to-layer="341" to-port="0" /> + <edge from-layer="334" from-port="0" to-layer="335" to-port="1" /> + <edge from-layer="335" from-port="2" to-layer="337" to-port="0" /> + <edge from-layer="336" from-port="0" to-layer="337" to-port="1" /> + <edge from-layer="337" from-port="2" to-layer="339" to-port="0" /> + <edge from-layer="338" from-port="0" to-layer="339" to-port="1" /> + <edge from-layer="339" from-port="2" to-layer="340" to-port="0" /> + <edge from-layer="340" from-port="1" to-layer="341" to-port="1" /> + <edge from-layer="341" from-port="2" to-layer="342" to-port="1" /> + <edge from-layer="342" from-port="2" to-layer="343" to-port="1" /> + <edge from-layer="343" from-port="2" to-layer="354" to-port="0" /> + <edge from-layer="343" from-port="2" to-layer="366" to-port="0" /> + <edge from-layer="344" from-port="0" to-layer="345" to-port="0" /> + <edge from-layer="345" from-port="1" to-layer="348" to-port="0" /> + <edge from-layer="346" from-port="0" to-layer="347" to-port="0" /> + <edge from-layer="347" from-port="1" to-layer="348" to-port="1" /> + <edge from-layer="348" from-port="2" to-layer="350" to-port="0" /> + <edge from-layer="349" from-port="0" to-layer="350" to-port="1" /> + <edge from-layer="350" from-port="2" to-layer="352" to-port="0" /> + <edge from-layer="351" from-port="0" to-layer="352" to-port="1" /> + <edge from-layer="352" from-port="2" to-layer="353" to-port="0" /> + <edge from-layer="353" from-port="1" to-layer="354" to-port="1" /> + <edge from-layer="354" from-port="2" to-layer="355" to-port="0" /> + <edge from-layer="355" from-port="1" to-layer="367" to-port="0" /> + <edge from-layer="356" from-port="0" to-layer="357" to-port="0" /> + <edge from-layer="357" from-port="1" to-layer="360" to-port="0" /> + <edge from-layer="358" from-port="0" to-layer="359" to-port="0" /> + <edge from-layer="359" from-port="1" to-layer="360" to-port="1" /> + <edge from-layer="360" from-port="2" to-layer="362" to-port="0" /> + <edge from-layer="361" from-port="0" to-layer="362" to-port="1" /> + <edge from-layer="362" from-port="2" to-layer="364" to-port="0" /> + <edge from-layer="363" from-port="0" to-layer="364" to-port="1" /> + <edge from-layer="364" from-port="2" to-layer="365" to-port="0" /> + <edge from-layer="365" from-port="1" to-layer="366" to-port="1" /> + <edge from-layer="366" from-port="2" to-layer="367" to-port="1" /> + <edge from-layer="367" from-port="2" to-layer="378" to-port="0" /> + <edge from-layer="368" from-port="0" to-layer="369" to-port="0" /> + <edge from-layer="369" from-port="1" to-layer="372" to-port="0" /> + <edge from-layer="370" from-port="0" to-layer="371" to-port="0" /> + <edge from-layer="371" from-port="1" to-layer="372" to-port="1" /> + <edge from-layer="372" from-port="2" to-layer="374" to-port="0" /> + <edge from-layer="373" from-port="0" to-layer="374" to-port="1" /> + <edge from-layer="374" from-port="2" to-layer="376" to-port="0" /> + <edge from-layer="375" from-port="0" to-layer="376" to-port="1" /> + <edge from-layer="376" from-port="2" to-layer="377" to-port="0" /> + <edge from-layer="377" from-port="1" to-layer="378" to-port="1" /> + <edge from-layer="378" from-port="2" to-layer="379" to-port="1" /> + <edge from-layer="379" from-port="2" to-layer="383" to-port="0" /> + <edge from-layer="379" from-port="2" to-layer="563" to-port="0" /> + <edge from-layer="379" from-port="2" to-layer="390" to-port="0" /> + <edge from-layer="380" from-port="0" to-layer="391" to-port="0" /> + <edge from-layer="381" from-port="0" to-layer="389" to-port="0" /> + <edge from-layer="382" from-port="0" to-layer="383" to-port="1" /> + <edge from-layer="383" from-port="2" to-layer="385" to-port="0" /> + <edge from-layer="384" from-port="0" to-layer="385" to-port="1" /> + <edge from-layer="385" from-port="2" to-layer="387" to-port="0" /> + <edge from-layer="386" from-port="0" to-layer="387" to-port="1" /> + <edge from-layer="387" from-port="2" to-layer="388" to-port="0" /> + <edge from-layer="388" from-port="1" to-layer="389" to-port="1" /> + <edge from-layer="389" from-port="2" to-layer="390" to-port="1" /> + <edge from-layer="390" from-port="2" to-layer="391" to-port="1" /> + <edge from-layer="391" from-port="2" to-layer="450" to-port="0" /> + <edge from-layer="391" from-port="2" to-layer="402" to-port="0" /> + <edge from-layer="391" from-port="2" to-layer="512" to-port="0" /> + <edge from-layer="392" from-port="0" to-layer="393" to-port="0" /> + <edge from-layer="393" from-port="1" to-layer="396" to-port="0" /> + <edge from-layer="394" from-port="0" to-layer="395" to-port="0" /> + <edge from-layer="395" from-port="1" to-layer="396" to-port="1" /> + <edge from-layer="396" from-port="2" to-layer="398" to-port="0" /> + <edge from-layer="397" from-port="0" to-layer="398" to-port="1" /> + <edge from-layer="398" from-port="2" to-layer="400" to-port="0" /> + <edge from-layer="399" from-port="0" to-layer="400" to-port="1" /> + <edge from-layer="400" from-port="2" to-layer="401" to-port="0" /> + <edge from-layer="401" from-port="1" to-layer="402" to-port="1" /> + <edge from-layer="402" from-port="2" to-layer="405" to-port="0" /> + <edge from-layer="403" from-port="0" to-layer="404" to-port="0" /> + <edge from-layer="404" from-port="1" to-layer="405" to-port="1" /> + <edge from-layer="405" from-port="2" to-layer="407" to-port="0" /> + <edge from-layer="406" from-port="0" to-layer="407" to-port="1" /> + <edge from-layer="407" from-port="2" to-layer="409" to-port="0" /> + <edge from-layer="408" from-port="0" to-layer="409" to-port="1" /> + <edge from-layer="409" from-port="2" to-layer="411" to-port="0" /> + <edge from-layer="409" from-port="2" to-layer="427" to-port="0" /> + <edge from-layer="409" from-port="2" to-layer="421" to-port="0" /> + <edge from-layer="409" from-port="2" to-layer="410" to-port="0" /> + <edge from-layer="410" from-port="2" to-layer="430" to-port="0" /> + <edge from-layer="411" from-port="1" to-layer="413" to-port="0" /> + <edge from-layer="412" from-port="0" to-layer="413" to-port="2" /> + <edge from-layer="413" from-port="3" to-layer="414" to-port="0" /> + <edge from-layer="414" from-port="2" to-layer="415" to-port="0" /> + <edge from-layer="415" from-port="1" to-layer="417" to-port="0" /> + <edge from-layer="416" from-port="0" to-layer="417" to-port="1" /> + <edge from-layer="417" from-port="2" to-layer="427" to-port="2" /> + <edge from-layer="417" from-port="2" to-layer="421" to-port="1" /> + <edge from-layer="418" from-port="0" to-layer="421" to-port="2" /> + <edge from-layer="419" from-port="0" to-layer="421" to-port="3" /> + <edge from-layer="420" from-port="0" to-layer="421" to-port="4" /> + <edge from-layer="421" from-port="5" to-layer="423" to-port="0" /> + <edge from-layer="422" from-port="0" to-layer="423" to-port="1" /> + <edge from-layer="423" from-port="2" to-layer="428" to-port="0" /> + <edge from-layer="424" from-port="0" to-layer="427" to-port="1" /> + <edge from-layer="425" from-port="0" to-layer="427" to-port="3" /> + <edge from-layer="426" from-port="0" to-layer="427" to-port="4" /> + <edge from-layer="427" from-port="5" to-layer="428" to-port="1" /> + <edge from-layer="428" from-port="2" to-layer="429" to-port="0" /> + <edge from-layer="429" from-port="2" to-layer="430" to-port="1" /> + <edge from-layer="430" from-port="2" to-layer="547" to-port="0" /> + <edge from-layer="431" from-port="0" to-layer="436" to-port="0" /> + <edge from-layer="432" from-port="0" to-layer="435" to-port="1" /> + <edge from-layer="433" from-port="0" to-layer="435" to-port="2" /> + <edge from-layer="434" from-port="0" to-layer="435" to-port="3" /> + <edge from-layer="435" from-port="4" to-layer="436" to-port="1" /> + <edge from-layer="436" from-port="2" to-layer="437" to-port="0" /> + <edge from-layer="437" from-port="1" to-layer="439" to-port="0" /> + <edge from-layer="438" from-port="0" to-layer="439" to-port="2" /> + <edge from-layer="439" from-port="3" to-layer="479" to-port="0" /> + <edge from-layer="439" from-port="3" to-layer="535" to-port="0" /> + <edge from-layer="440" from-port="0" to-layer="441" to-port="0" /> + <edge from-layer="441" from-port="1" to-layer="444" to-port="0" /> + <edge from-layer="442" from-port="0" to-layer="443" to-port="0" /> + <edge from-layer="443" from-port="1" to-layer="444" to-port="1" /> + <edge from-layer="444" from-port="2" to-layer="446" to-port="0" /> + <edge from-layer="445" from-port="0" to-layer="446" to-port="1" /> + <edge from-layer="446" from-port="2" to-layer="448" to-port="0" /> + <edge from-layer="447" from-port="0" to-layer="448" to-port="1" /> + <edge from-layer="448" from-port="2" to-layer="449" to-port="0" /> + <edge from-layer="449" from-port="1" to-layer="450" to-port="1" /> + <edge from-layer="450" from-port="2" to-layer="453" to-port="0" /> + <edge from-layer="451" from-port="0" to-layer="452" to-port="0" /> + <edge from-layer="452" from-port="1" to-layer="453" to-port="1" /> + <edge from-layer="453" from-port="2" to-layer="455" to-port="0" /> + <edge from-layer="454" from-port="0" to-layer="455" to-port="1" /> + <edge from-layer="455" from-port="2" to-layer="457" to-port="0" /> + <edge from-layer="456" from-port="0" to-layer="457" to-port="1" /> + <edge from-layer="457" from-port="2" to-layer="469" to-port="0" /> + <edge from-layer="457" from-port="2" to-layer="475" to-port="0" /> + <edge from-layer="457" from-port="2" to-layer="458" to-port="0" /> + <edge from-layer="457" from-port="2" to-layer="459" to-port="0" /> + <edge from-layer="458" from-port="2" to-layer="478" to-port="0" /> + <edge from-layer="459" from-port="1" to-layer="461" to-port="0" /> + <edge from-layer="460" from-port="0" to-layer="461" to-port="2" /> + <edge from-layer="461" from-port="3" to-layer="462" to-port="0" /> + <edge from-layer="462" from-port="2" to-layer="463" to-port="0" /> + <edge from-layer="463" from-port="1" to-layer="465" to-port="0" /> + <edge from-layer="464" from-port="0" to-layer="465" to-port="1" /> + <edge from-layer="465" from-port="2" to-layer="469" to-port="1" /> + <edge from-layer="465" from-port="2" to-layer="475" to-port="2" /> + <edge from-layer="466" from-port="0" to-layer="469" to-port="2" /> + <edge from-layer="467" from-port="0" to-layer="469" to-port="3" /> + <edge from-layer="468" from-port="0" to-layer="469" to-port="4" /> + <edge from-layer="469" from-port="5" to-layer="471" to-port="0" /> + <edge from-layer="470" from-port="0" to-layer="471" to-port="1" /> + <edge from-layer="471" from-port="2" to-layer="476" to-port="0" /> + <edge from-layer="472" from-port="0" to-layer="475" to-port="1" /> + <edge from-layer="473" from-port="0" to-layer="475" to-port="3" /> + <edge from-layer="474" from-port="0" to-layer="475" to-port="4" /> + <edge from-layer="475" from-port="5" to-layer="476" to-port="1" /> + <edge from-layer="476" from-port="2" to-layer="477" to-port="0" /> + <edge from-layer="477" from-port="2" to-layer="478" to-port="1" /> + <edge from-layer="478" from-port="2" to-layer="539" to-port="0" /> + <edge from-layer="478" from-port="2" to-layer="479" to-port="1" /> + <edge from-layer="479" from-port="2" to-layer="11224" to-port="0" /> + <edge from-layer="479" from-port="2" to-layer="480" to-port="0" /> + <edge from-layer="479" from-port="2" to-layer="481" to-port="0" /> + <edge from-layer="480" from-port="2" to-layer="490" to-port="0" /> + <edge from-layer="481" from-port="1" to-layer="484" to-port="0" /> + <edge from-layer="481" from-port="1" to-layer="488" to-port="0" /> + <edge from-layer="482" from-port="0" to-layer="484" to-port="1" /> + <edge from-layer="483" from-port="0" to-layer="484" to-port="2" /> + <edge from-layer="484" from-port="3" to-layer="489" to-port="0" /> + <edge from-layer="485" from-port="0" to-layer="489" to-port="1" /> + <edge from-layer="486" from-port="0" to-layer="488" to-port="1" /> + <edge from-layer="487" from-port="0" to-layer="488" to-port="2" /> + <edge from-layer="488" from-port="3" to-layer="489" to-port="2" /> + <edge from-layer="489" from-port="3" to-layer="490" to-port="1" /> + <edge from-layer="490" from-port="2" to-layer="492" to-port="0" /> + <edge from-layer="491" from-port="0" to-layer="492" to-port="1" /> + <edge from-layer="492" from-port="2" to-layer="547" to-port="1" /> + <edge from-layer="493" from-port="0" to-layer="498" to-port="0" /> + <edge from-layer="494" from-port="0" to-layer="497" to-port="1" /> + <edge from-layer="495" from-port="0" to-layer="497" to-port="2" /> + <edge from-layer="496" from-port="0" to-layer="497" to-port="3" /> + <edge from-layer="497" from-port="4" to-layer="498" to-port="1" /> + <edge from-layer="498" from-port="2" to-layer="499" to-port="0" /> + <edge from-layer="499" from-port="1" to-layer="501" to-port="0" /> + <edge from-layer="500" from-port="0" to-layer="501" to-port="2" /> + <edge from-layer="501" from-port="3" to-layer="520" to-port="0" /> + <edge from-layer="502" from-port="0" to-layer="503" to-port="0" /> + <edge from-layer="503" from-port="1" to-layer="506" to-port="0" /> + <edge from-layer="504" from-port="0" to-layer="505" to-port="0" /> + <edge from-layer="505" from-port="1" to-layer="506" to-port="1" /> + <edge from-layer="506" from-port="2" to-layer="508" to-port="0" /> + <edge from-layer="507" from-port="0" to-layer="508" to-port="1" /> + <edge from-layer="508" from-port="2" to-layer="510" to-port="0" /> + <edge from-layer="509" from-port="0" to-layer="510" to-port="1" /> + <edge from-layer="510" from-port="2" to-layer="511" to-port="0" /> + <edge from-layer="511" from-port="1" to-layer="512" to-port="1" /> + <edge from-layer="512" from-port="2" to-layer="515" to-port="0" /> + <edge from-layer="513" from-port="0" to-layer="514" to-port="0" /> + <edge from-layer="514" from-port="1" to-layer="515" to-port="1" /> + <edge from-layer="515" from-port="2" to-layer="517" to-port="0" /> + <edge from-layer="516" from-port="0" to-layer="517" to-port="1" /> + <edge from-layer="517" from-port="2" to-layer="519" to-port="0" /> + <edge from-layer="518" from-port="0" to-layer="519" to-port="1" /> + <edge from-layer="519" from-port="2" to-layer="520" to-port="1" /> + <edge from-layer="520" from-port="2" to-layer="521" to-port="0" /> + <edge from-layer="520" from-port="2" to-layer="522" to-port="0" /> + <edge from-layer="520" from-port="2" to-layer="11223" to-port="0" /> + <edge from-layer="521" from-port="2" to-layer="531" to-port="0" /> + <edge from-layer="522" from-port="1" to-layer="525" to-port="0" /> + <edge from-layer="522" from-port="1" to-layer="529" to-port="0" /> + <edge from-layer="523" from-port="0" to-layer="525" to-port="1" /> + <edge from-layer="524" from-port="0" to-layer="525" to-port="2" /> + <edge from-layer="525" from-port="3" to-layer="530" to-port="1" /> + <edge from-layer="526" from-port="0" to-layer="530" to-port="2" /> + <edge from-layer="527" from-port="0" to-layer="529" to-port="1" /> + <edge from-layer="528" from-port="0" to-layer="529" to-port="2" /> + <edge from-layer="529" from-port="3" to-layer="530" to-port="3" /> + <edge from-layer="530" from-port="4" to-layer="531" to-port="1" /> + <edge from-layer="531" from-port="2" to-layer="533" to-port="0" /> + <edge from-layer="532" from-port="0" to-layer="533" to-port="1" /> + <edge from-layer="533" from-port="2" to-layer="547" to-port="2" /> + <edge from-layer="534" from-port="0" to-layer="546" to-port="1" /> + <edge from-layer="535" from-port="1" to-layer="538" to-port="0" /> + <edge from-layer="536" from-port="0" to-layer="538" to-port="1" /> + <edge from-layer="537" from-port="0" to-layer="538" to-port="2" /> + <edge from-layer="538" from-port="3" to-layer="543" to-port="0" /> + <edge from-layer="539" from-port="1" to-layer="542" to-port="0" /> + <edge from-layer="540" from-port="0" to-layer="542" to-port="1" /> + <edge from-layer="541" from-port="0" to-layer="542" to-port="2" /> + <edge from-layer="542" from-port="3" to-layer="543" to-port="1" /> + <edge from-layer="543" from-port="2" to-layer="546" to-port="2" /> + <edge from-layer="544" from-port="0" to-layer="546" to-port="3" /> + <edge from-layer="545" from-port="0" to-layer="546" to-port="4" /> + <edge from-layer="546" from-port="5" to-layer="547" to-port="3" /> + <edge from-layer="547" from-port="4" to-layer="549" to-port="0" /> + <edge from-layer="548" from-port="0" to-layer="549" to-port="1" /> + <edge from-layer="549" from-port="2" to-layer="551" to-port="0" /> + <edge from-layer="550" from-port="0" to-layer="551" to-port="1" /> + <edge from-layer="551" from-port="2" to-layer="562" to-port="0" /> + <edge from-layer="552" from-port="0" to-layer="553" to-port="0" /> + <edge from-layer="553" from-port="1" to-layer="556" to-port="0" /> + <edge from-layer="554" from-port="0" to-layer="555" to-port="0" /> + <edge from-layer="555" from-port="1" to-layer="556" to-port="1" /> + <edge from-layer="556" from-port="2" to-layer="558" to-port="0" /> + <edge from-layer="557" from-port="0" to-layer="558" to-port="1" /> + <edge from-layer="558" from-port="2" to-layer="560" to-port="0" /> + <edge from-layer="559" from-port="0" to-layer="560" to-port="1" /> + <edge from-layer="560" from-port="2" to-layer="561" to-port="0" /> + <edge from-layer="561" from-port="1" to-layer="562" to-port="1" /> + <edge from-layer="562" from-port="2" to-layer="563" to-port="1" /> + <edge from-layer="563" from-port="2" to-layer="567" to-port="0" /> + <edge from-layer="563" from-port="2" to-layer="611" to-port="0" /> + <edge from-layer="563" from-port="2" to-layer="574" to-port="0" /> + <edge from-layer="564" from-port="0" to-layer="575" to-port="0" /> + <edge from-layer="565" from-port="0" to-layer="573" to-port="0" /> + <edge from-layer="566" from-port="0" to-layer="567" to-port="1" /> + <edge from-layer="567" from-port="2" to-layer="569" to-port="0" /> + <edge from-layer="568" from-port="0" to-layer="569" to-port="1" /> + <edge from-layer="569" from-port="2" to-layer="571" to-port="0" /> + <edge from-layer="570" from-port="0" to-layer="571" to-port="1" /> + <edge from-layer="571" from-port="2" to-layer="572" to-port="0" /> + <edge from-layer="572" from-port="1" to-layer="573" to-port="1" /> + <edge from-layer="573" from-port="2" to-layer="574" to-port="1" /> + <edge from-layer="574" from-port="2" to-layer="575" to-port="1" /> + <edge from-layer="575" from-port="2" to-layer="586" to-port="0" /> + <edge from-layer="575" from-port="2" to-layer="598" to-port="0" /> + <edge from-layer="576" from-port="0" to-layer="577" to-port="0" /> + <edge from-layer="577" from-port="1" to-layer="580" to-port="0" /> + <edge from-layer="578" from-port="0" to-layer="579" to-port="0" /> + <edge from-layer="579" from-port="1" to-layer="580" to-port="1" /> + <edge from-layer="580" from-port="2" to-layer="582" to-port="0" /> + <edge from-layer="581" from-port="0" to-layer="582" to-port="1" /> + <edge from-layer="582" from-port="2" to-layer="584" to-port="0" /> + <edge from-layer="583" from-port="0" to-layer="584" to-port="1" /> + <edge from-layer="584" from-port="2" to-layer="585" to-port="0" /> + <edge from-layer="585" from-port="1" to-layer="586" to-port="1" /> + <edge from-layer="586" from-port="2" to-layer="587" to-port="0" /> + <edge from-layer="587" from-port="1" to-layer="599" to-port="0" /> + <edge from-layer="588" from-port="0" to-layer="589" to-port="0" /> + <edge from-layer="589" from-port="1" to-layer="592" to-port="0" /> + <edge from-layer="590" from-port="0" to-layer="591" to-port="0" /> + <edge from-layer="591" from-port="1" to-layer="592" to-port="1" /> + <edge from-layer="592" from-port="2" to-layer="594" to-port="0" /> + <edge from-layer="593" from-port="0" to-layer="594" to-port="1" /> + <edge from-layer="594" from-port="2" to-layer="596" to-port="0" /> + <edge from-layer="595" from-port="0" to-layer="596" to-port="1" /> + <edge from-layer="596" from-port="2" to-layer="597" to-port="0" /> + <edge from-layer="597" from-port="1" to-layer="598" to-port="1" /> + <edge from-layer="598" from-port="2" to-layer="599" to-port="1" /> + <edge from-layer="599" from-port="2" to-layer="610" to-port="0" /> + <edge from-layer="600" from-port="0" to-layer="601" to-port="0" /> + <edge from-layer="601" from-port="1" to-layer="604" to-port="0" /> + <edge from-layer="602" from-port="0" to-layer="603" to-port="0" /> + <edge from-layer="603" from-port="1" to-layer="604" to-port="1" /> + <edge from-layer="604" from-port="2" to-layer="606" to-port="0" /> + <edge from-layer="605" from-port="0" to-layer="606" to-port="1" /> + <edge from-layer="606" from-port="2" to-layer="608" to-port="0" /> + <edge from-layer="607" from-port="0" to-layer="608" to-port="1" /> + <edge from-layer="608" from-port="2" to-layer="609" to-port="0" /> + <edge from-layer="609" from-port="1" to-layer="610" to-port="1" /> + <edge from-layer="610" from-port="2" to-layer="611" to-port="1" /> + <edge from-layer="611" from-port="2" to-layer="615" to-port="0" /> + <edge from-layer="611" from-port="2" to-layer="795" to-port="0" /> + <edge from-layer="611" from-port="2" to-layer="622" to-port="0" /> + <edge from-layer="612" from-port="0" to-layer="623" to-port="0" /> + <edge from-layer="613" from-port="0" to-layer="621" to-port="0" /> + <edge from-layer="614" from-port="0" to-layer="615" to-port="1" /> + <edge from-layer="615" from-port="2" to-layer="617" to-port="0" /> + <edge from-layer="616" from-port="0" to-layer="617" to-port="1" /> + <edge from-layer="617" from-port="2" to-layer="619" to-port="0" /> + <edge from-layer="618" from-port="0" to-layer="619" to-port="1" /> + <edge from-layer="619" from-port="2" to-layer="620" to-port="0" /> + <edge from-layer="620" from-port="1" to-layer="621" to-port="1" /> + <edge from-layer="621" from-port="2" to-layer="622" to-port="1" /> + <edge from-layer="622" from-port="2" to-layer="623" to-port="1" /> + <edge from-layer="623" from-port="2" to-layer="744" to-port="0" /> + <edge from-layer="623" from-port="2" to-layer="682" to-port="0" /> + <edge from-layer="623" from-port="2" to-layer="634" to-port="0" /> + <edge from-layer="624" from-port="0" to-layer="625" to-port="0" /> + <edge from-layer="625" from-port="1" to-layer="628" to-port="0" /> + <edge from-layer="626" from-port="0" to-layer="627" to-port="0" /> + <edge from-layer="627" from-port="1" to-layer="628" to-port="1" /> + <edge from-layer="628" from-port="2" to-layer="630" to-port="0" /> + <edge from-layer="629" from-port="0" to-layer="630" to-port="1" /> + <edge from-layer="630" from-port="2" to-layer="632" to-port="0" /> + <edge from-layer="631" from-port="0" to-layer="632" to-port="1" /> + <edge from-layer="632" from-port="2" to-layer="633" to-port="0" /> + <edge from-layer="633" from-port="1" to-layer="634" to-port="1" /> + <edge from-layer="634" from-port="2" to-layer="637" to-port="0" /> + <edge from-layer="635" from-port="0" to-layer="636" to-port="0" /> + <edge from-layer="636" from-port="1" to-layer="637" to-port="1" /> + <edge from-layer="637" from-port="2" to-layer="639" to-port="0" /> + <edge from-layer="638" from-port="0" to-layer="639" to-port="1" /> + <edge from-layer="639" from-port="2" to-layer="641" to-port="0" /> + <edge from-layer="640" from-port="0" to-layer="641" to-port="1" /> + <edge from-layer="641" from-port="2" to-layer="643" to-port="0" /> + <edge from-layer="641" from-port="2" to-layer="659" to-port="0" /> + <edge from-layer="641" from-port="2" to-layer="642" to-port="0" /> + <edge from-layer="641" from-port="2" to-layer="653" to-port="0" /> + <edge from-layer="642" from-port="2" to-layer="662" to-port="0" /> + <edge from-layer="643" from-port="1" to-layer="645" to-port="0" /> + <edge from-layer="644" from-port="0" to-layer="645" to-port="2" /> + <edge from-layer="645" from-port="3" to-layer="646" to-port="0" /> + <edge from-layer="646" from-port="2" to-layer="647" to-port="0" /> + <edge from-layer="647" from-port="1" to-layer="649" to-port="0" /> + <edge from-layer="648" from-port="0" to-layer="649" to-port="1" /> + <edge from-layer="649" from-port="2" to-layer="659" to-port="2" /> + <edge from-layer="649" from-port="2" to-layer="653" to-port="1" /> + <edge from-layer="650" from-port="0" to-layer="653" to-port="2" /> + <edge from-layer="651" from-port="0" to-layer="653" to-port="3" /> + <edge from-layer="652" from-port="0" to-layer="653" to-port="4" /> + <edge from-layer="653" from-port="5" to-layer="655" to-port="0" /> + <edge from-layer="654" from-port="0" to-layer="655" to-port="1" /> + <edge from-layer="655" from-port="2" to-layer="660" to-port="0" /> + <edge from-layer="656" from-port="0" to-layer="659" to-port="1" /> + <edge from-layer="657" from-port="0" to-layer="659" to-port="3" /> + <edge from-layer="658" from-port="0" to-layer="659" to-port="4" /> + <edge from-layer="659" from-port="5" to-layer="660" to-port="1" /> + <edge from-layer="660" from-port="2" to-layer="661" to-port="0" /> + <edge from-layer="661" from-port="2" to-layer="662" to-port="1" /> + <edge from-layer="662" from-port="2" to-layer="779" to-port="0" /> + <edge from-layer="663" from-port="0" to-layer="668" to-port="0" /> + <edge from-layer="664" from-port="0" to-layer="667" to-port="1" /> + <edge from-layer="665" from-port="0" to-layer="667" to-port="2" /> + <edge from-layer="666" from-port="0" to-layer="667" to-port="3" /> + <edge from-layer="667" from-port="4" to-layer="668" to-port="1" /> + <edge from-layer="668" from-port="2" to-layer="669" to-port="0" /> + <edge from-layer="669" from-port="1" to-layer="671" to-port="0" /> + <edge from-layer="670" from-port="0" to-layer="671" to-port="2" /> + <edge from-layer="671" from-port="3" to-layer="767" to-port="0" /> + <edge from-layer="671" from-port="3" to-layer="711" to-port="0" /> + <edge from-layer="672" from-port="0" to-layer="673" to-port="0" /> + <edge from-layer="673" from-port="1" to-layer="676" to-port="0" /> + <edge from-layer="674" from-port="0" to-layer="675" to-port="0" /> + <edge from-layer="675" from-port="1" to-layer="676" to-port="1" /> + <edge from-layer="676" from-port="2" to-layer="678" to-port="0" /> + <edge from-layer="677" from-port="0" to-layer="678" to-port="1" /> + <edge from-layer="678" from-port="2" to-layer="680" to-port="0" /> + <edge from-layer="679" from-port="0" to-layer="680" to-port="1" /> + <edge from-layer="680" from-port="2" to-layer="681" to-port="0" /> + <edge from-layer="681" from-port="1" to-layer="682" to-port="1" /> + <edge from-layer="682" from-port="2" to-layer="685" to-port="0" /> + <edge from-layer="683" from-port="0" to-layer="684" to-port="0" /> + <edge from-layer="684" from-port="1" to-layer="685" to-port="1" /> + <edge from-layer="685" from-port="2" to-layer="687" to-port="0" /> + <edge from-layer="686" from-port="0" to-layer="687" to-port="1" /> + <edge from-layer="687" from-port="2" to-layer="689" to-port="0" /> + <edge from-layer="688" from-port="0" to-layer="689" to-port="1" /> + <edge from-layer="689" from-port="2" to-layer="690" to-port="0" /> + <edge from-layer="689" from-port="2" to-layer="691" to-port="0" /> + <edge from-layer="689" from-port="2" to-layer="707" to-port="0" /> + <edge from-layer="689" from-port="2" to-layer="701" to-port="0" /> + <edge from-layer="690" from-port="2" to-layer="710" to-port="0" /> + <edge from-layer="691" from-port="1" to-layer="693" to-port="0" /> + <edge from-layer="692" from-port="0" to-layer="693" to-port="2" /> + <edge from-layer="693" from-port="3" to-layer="694" to-port="0" /> + <edge from-layer="694" from-port="2" to-layer="695" to-port="0" /> + <edge from-layer="695" from-port="1" to-layer="697" to-port="0" /> + <edge from-layer="696" from-port="0" to-layer="697" to-port="1" /> + <edge from-layer="697" from-port="2" to-layer="701" to-port="1" /> + <edge from-layer="697" from-port="2" to-layer="707" to-port="2" /> + <edge from-layer="698" from-port="0" to-layer="701" to-port="2" /> + <edge from-layer="699" from-port="0" to-layer="701" to-port="3" /> + <edge from-layer="700" from-port="0" to-layer="701" to-port="4" /> + <edge from-layer="701" from-port="5" to-layer="703" to-port="0" /> + <edge from-layer="702" from-port="0" to-layer="703" to-port="1" /> + <edge from-layer="703" from-port="2" to-layer="708" to-port="0" /> + <edge from-layer="704" from-port="0" to-layer="707" to-port="1" /> + <edge from-layer="705" from-port="0" to-layer="707" to-port="3" /> + <edge from-layer="706" from-port="0" to-layer="707" to-port="4" /> + <edge from-layer="707" from-port="5" to-layer="708" to-port="1" /> + <edge from-layer="708" from-port="2" to-layer="709" to-port="0" /> + <edge from-layer="709" from-port="2" to-layer="710" to-port="1" /> + <edge from-layer="710" from-port="2" to-layer="771" to-port="0" /> + <edge from-layer="710" from-port="2" to-layer="711" to-port="1" /> + <edge from-layer="711" from-port="2" to-layer="712" to-port="0" /> + <edge from-layer="711" from-port="2" to-layer="11202" to-port="0" /> + <edge from-layer="711" from-port="2" to-layer="713" to-port="0" /> + <edge from-layer="712" from-port="2" to-layer="722" to-port="0" /> + <edge from-layer="713" from-port="1" to-layer="716" to-port="0" /> + <edge from-layer="713" from-port="1" to-layer="720" to-port="0" /> + <edge from-layer="714" from-port="0" to-layer="716" to-port="1" /> + <edge from-layer="715" from-port="0" to-layer="716" to-port="2" /> + <edge from-layer="716" from-port="3" to-layer="721" to-port="0" /> + <edge from-layer="717" from-port="0" to-layer="721" to-port="1" /> + <edge from-layer="718" from-port="0" to-layer="720" to-port="1" /> + <edge from-layer="719" from-port="0" to-layer="720" to-port="2" /> + <edge from-layer="720" from-port="3" to-layer="721" to-port="2" /> + <edge from-layer="721" from-port="3" to-layer="722" to-port="1" /> + <edge from-layer="722" from-port="2" to-layer="724" to-port="0" /> + <edge from-layer="723" from-port="0" to-layer="724" to-port="1" /> + <edge from-layer="724" from-port="2" to-layer="779" to-port="1" /> + <edge from-layer="725" from-port="0" to-layer="730" to-port="0" /> + <edge from-layer="726" from-port="0" to-layer="729" to-port="1" /> + <edge from-layer="727" from-port="0" to-layer="729" to-port="2" /> + <edge from-layer="728" from-port="0" to-layer="729" to-port="3" /> + <edge from-layer="729" from-port="4" to-layer="730" to-port="1" /> + <edge from-layer="730" from-port="2" to-layer="731" to-port="0" /> + <edge from-layer="731" from-port="1" to-layer="733" to-port="0" /> + <edge from-layer="732" from-port="0" to-layer="733" to-port="2" /> + <edge from-layer="733" from-port="3" to-layer="752" to-port="0" /> + <edge from-layer="734" from-port="0" to-layer="735" to-port="0" /> + <edge from-layer="735" from-port="1" to-layer="738" to-port="0" /> + <edge from-layer="736" from-port="0" to-layer="737" to-port="0" /> + <edge from-layer="737" from-port="1" to-layer="738" to-port="1" /> + <edge from-layer="738" from-port="2" to-layer="740" to-port="0" /> + <edge from-layer="739" from-port="0" to-layer="740" to-port="1" /> + <edge from-layer="740" from-port="2" to-layer="742" to-port="0" /> + <edge from-layer="741" from-port="0" to-layer="742" to-port="1" /> + <edge from-layer="742" from-port="2" to-layer="743" to-port="0" /> + <edge from-layer="743" from-port="1" to-layer="744" to-port="1" /> + <edge from-layer="744" from-port="2" to-layer="747" to-port="0" /> + <edge from-layer="745" from-port="0" to-layer="746" to-port="0" /> + <edge from-layer="746" from-port="1" to-layer="747" to-port="1" /> + <edge from-layer="747" from-port="2" to-layer="749" to-port="0" /> + <edge from-layer="748" from-port="0" to-layer="749" to-port="1" /> + <edge from-layer="749" from-port="2" to-layer="751" to-port="0" /> + <edge from-layer="750" from-port="0" to-layer="751" to-port="1" /> + <edge from-layer="751" from-port="2" to-layer="752" to-port="1" /> + <edge from-layer="752" from-port="2" to-layer="754" to-port="0" /> + <edge from-layer="752" from-port="2" to-layer="11201" to-port="0" /> + <edge from-layer="752" from-port="2" to-layer="753" to-port="0" /> + <edge from-layer="753" from-port="2" to-layer="763" to-port="0" /> + <edge from-layer="754" from-port="1" to-layer="757" to-port="0" /> + <edge from-layer="754" from-port="1" to-layer="761" to-port="0" /> + <edge from-layer="755" from-port="0" to-layer="757" to-port="1" /> + <edge from-layer="756" from-port="0" to-layer="757" to-port="2" /> + <edge from-layer="757" from-port="3" to-layer="762" to-port="1" /> + <edge from-layer="758" from-port="0" to-layer="762" to-port="2" /> + <edge from-layer="759" from-port="0" to-layer="761" to-port="1" /> + <edge from-layer="760" from-port="0" to-layer="761" to-port="2" /> + <edge from-layer="761" from-port="3" to-layer="762" to-port="3" /> + <edge from-layer="762" from-port="4" to-layer="763" to-port="1" /> + <edge from-layer="763" from-port="2" to-layer="765" to-port="0" /> + <edge from-layer="764" from-port="0" to-layer="765" to-port="1" /> + <edge from-layer="765" from-port="2" to-layer="779" to-port="2" /> + <edge from-layer="766" from-port="0" to-layer="778" to-port="1" /> + <edge from-layer="767" from-port="1" to-layer="770" to-port="0" /> + <edge from-layer="768" from-port="0" to-layer="770" to-port="1" /> + <edge from-layer="769" from-port="0" to-layer="770" to-port="2" /> + <edge from-layer="770" from-port="3" to-layer="775" to-port="0" /> + <edge from-layer="771" from-port="1" to-layer="774" to-port="0" /> + <edge from-layer="772" from-port="0" to-layer="774" to-port="1" /> + <edge from-layer="773" from-port="0" to-layer="774" to-port="2" /> + <edge from-layer="774" from-port="3" to-layer="775" to-port="1" /> + <edge from-layer="775" from-port="2" to-layer="778" to-port="2" /> + <edge from-layer="776" from-port="0" to-layer="778" to-port="3" /> + <edge from-layer="777" from-port="0" to-layer="778" to-port="4" /> + <edge from-layer="778" from-port="5" to-layer="779" to-port="3" /> + <edge from-layer="779" from-port="4" to-layer="781" to-port="0" /> + <edge from-layer="780" from-port="0" to-layer="781" to-port="1" /> + <edge from-layer="781" from-port="2" to-layer="783" to-port="0" /> + <edge from-layer="782" from-port="0" to-layer="783" to-port="1" /> + <edge from-layer="783" from-port="2" to-layer="794" to-port="0" /> + <edge from-layer="784" from-port="0" to-layer="785" to-port="0" /> + <edge from-layer="785" from-port="1" to-layer="788" to-port="0" /> + <edge from-layer="786" from-port="0" to-layer="787" to-port="0" /> + <edge from-layer="787" from-port="1" to-layer="788" to-port="1" /> + <edge from-layer="788" from-port="2" to-layer="790" to-port="0" /> + <edge from-layer="789" from-port="0" to-layer="790" to-port="1" /> + <edge from-layer="790" from-port="2" to-layer="792" to-port="0" /> + <edge from-layer="791" from-port="0" to-layer="792" to-port="1" /> + <edge from-layer="792" from-port="2" to-layer="793" to-port="0" /> + <edge from-layer="793" from-port="1" to-layer="794" to-port="1" /> + <edge from-layer="794" from-port="2" to-layer="795" to-port="1" /> + <edge from-layer="795" from-port="2" to-layer="799" to-port="0" /> + <edge from-layer="795" from-port="2" to-layer="843" to-port="0" /> + <edge from-layer="795" from-port="2" to-layer="806" to-port="0" /> + <edge from-layer="796" from-port="0" to-layer="807" to-port="0" /> + <edge from-layer="797" from-port="0" to-layer="805" to-port="0" /> + <edge from-layer="798" from-port="0" to-layer="799" to-port="1" /> + <edge from-layer="799" from-port="2" to-layer="801" to-port="0" /> + <edge from-layer="800" from-port="0" to-layer="801" to-port="1" /> + <edge from-layer="801" from-port="2" to-layer="803" to-port="0" /> + <edge from-layer="802" from-port="0" to-layer="803" to-port="1" /> + <edge from-layer="803" from-port="2" to-layer="804" to-port="0" /> + <edge from-layer="804" from-port="1" to-layer="805" to-port="1" /> + <edge from-layer="805" from-port="2" to-layer="806" to-port="1" /> + <edge from-layer="806" from-port="2" to-layer="807" to-port="1" /> + <edge from-layer="807" from-port="2" to-layer="830" to-port="0" /> + <edge from-layer="807" from-port="2" to-layer="818" to-port="0" /> + <edge from-layer="808" from-port="0" to-layer="809" to-port="0" /> + <edge from-layer="809" from-port="1" to-layer="812" to-port="0" /> + <edge from-layer="810" from-port="0" to-layer="811" to-port="0" /> + <edge from-layer="811" from-port="1" to-layer="812" to-port="1" /> + <edge from-layer="812" from-port="2" to-layer="814" to-port="0" /> + <edge from-layer="813" from-port="0" to-layer="814" to-port="1" /> + <edge from-layer="814" from-port="2" to-layer="816" to-port="0" /> + <edge from-layer="815" from-port="0" to-layer="816" to-port="1" /> + <edge from-layer="816" from-port="2" to-layer="817" to-port="0" /> + <edge from-layer="817" from-port="1" to-layer="818" to-port="1" /> + <edge from-layer="818" from-port="2" to-layer="819" to-port="0" /> + <edge from-layer="819" from-port="1" to-layer="831" to-port="0" /> + <edge from-layer="820" from-port="0" to-layer="821" to-port="0" /> + <edge from-layer="821" from-port="1" to-layer="824" to-port="0" /> + <edge from-layer="822" from-port="0" to-layer="823" to-port="0" /> + <edge from-layer="823" from-port="1" to-layer="824" to-port="1" /> + <edge from-layer="824" from-port="2" to-layer="826" to-port="0" /> + <edge from-layer="825" from-port="0" to-layer="826" to-port="1" /> + <edge from-layer="826" from-port="2" to-layer="828" to-port="0" /> + <edge from-layer="827" from-port="0" to-layer="828" to-port="1" /> + <edge from-layer="828" from-port="2" to-layer="829" to-port="0" /> + <edge from-layer="829" from-port="1" to-layer="830" to-port="1" /> + <edge from-layer="830" from-port="2" to-layer="831" to-port="1" /> + <edge from-layer="831" from-port="2" to-layer="842" to-port="0" /> + <edge from-layer="832" from-port="0" to-layer="833" to-port="0" /> + <edge from-layer="833" from-port="1" to-layer="836" to-port="0" /> + <edge from-layer="834" from-port="0" to-layer="835" to-port="0" /> + <edge from-layer="835" from-port="1" to-layer="836" to-port="1" /> + <edge from-layer="836" from-port="2" to-layer="838" to-port="0" /> + <edge from-layer="837" from-port="0" to-layer="838" to-port="1" /> + <edge from-layer="838" from-port="2" to-layer="840" to-port="0" /> + <edge from-layer="839" from-port="0" to-layer="840" to-port="1" /> + <edge from-layer="840" from-port="2" to-layer="841" to-port="0" /> + <edge from-layer="841" from-port="1" to-layer="842" to-port="1" /> + <edge from-layer="842" from-port="2" to-layer="843" to-port="1" /> + <edge from-layer="843" from-port="2" to-layer="1027" to-port="0" /> + <edge from-layer="843" from-port="2" to-layer="847" to-port="0" /> + <edge from-layer="843" from-port="2" to-layer="854" to-port="0" /> + <edge from-layer="844" from-port="0" to-layer="855" to-port="0" /> + <edge from-layer="845" from-port="0" to-layer="853" to-port="0" /> + <edge from-layer="846" from-port="0" to-layer="847" to-port="1" /> + <edge from-layer="847" from-port="2" to-layer="849" to-port="0" /> + <edge from-layer="848" from-port="0" to-layer="849" to-port="1" /> + <edge from-layer="849" from-port="2" to-layer="851" to-port="0" /> + <edge from-layer="850" from-port="0" to-layer="851" to-port="1" /> + <edge from-layer="851" from-port="2" to-layer="852" to-port="0" /> + <edge from-layer="852" from-port="1" to-layer="853" to-port="1" /> + <edge from-layer="853" from-port="2" to-layer="854" to-port="1" /> + <edge from-layer="854" from-port="2" to-layer="855" to-port="1" /> + <edge from-layer="855" from-port="2" to-layer="976" to-port="0" /> + <edge from-layer="855" from-port="2" to-layer="866" to-port="0" /> + <edge from-layer="855" from-port="2" to-layer="914" to-port="0" /> + <edge from-layer="856" from-port="0" to-layer="857" to-port="0" /> + <edge from-layer="857" from-port="1" to-layer="860" to-port="0" /> + <edge from-layer="858" from-port="0" to-layer="859" to-port="0" /> + <edge from-layer="859" from-port="1" to-layer="860" to-port="1" /> + <edge from-layer="860" from-port="2" to-layer="862" to-port="0" /> + <edge from-layer="861" from-port="0" to-layer="862" to-port="1" /> + <edge from-layer="862" from-port="2" to-layer="864" to-port="0" /> + <edge from-layer="863" from-port="0" to-layer="864" to-port="1" /> + <edge from-layer="864" from-port="2" to-layer="865" to-port="0" /> + <edge from-layer="865" from-port="1" to-layer="866" to-port="1" /> + <edge from-layer="866" from-port="2" to-layer="869" to-port="0" /> + <edge from-layer="867" from-port="0" to-layer="868" to-port="0" /> + <edge from-layer="868" from-port="1" to-layer="869" to-port="1" /> + <edge from-layer="869" from-port="2" to-layer="871" to-port="0" /> + <edge from-layer="870" from-port="0" to-layer="871" to-port="1" /> + <edge from-layer="871" from-port="2" to-layer="873" to-port="0" /> + <edge from-layer="872" from-port="0" to-layer="873" to-port="1" /> + <edge from-layer="873" from-port="2" to-layer="891" to-port="0" /> + <edge from-layer="873" from-port="2" to-layer="885" to-port="0" /> + <edge from-layer="873" from-port="2" to-layer="874" to-port="0" /> + <edge from-layer="873" from-port="2" to-layer="875" to-port="0" /> + <edge from-layer="874" from-port="2" to-layer="894" to-port="0" /> + <edge from-layer="875" from-port="1" to-layer="877" to-port="0" /> + <edge from-layer="876" from-port="0" to-layer="877" to-port="2" /> + <edge from-layer="877" from-port="3" to-layer="878" to-port="0" /> + <edge from-layer="878" from-port="2" to-layer="879" to-port="0" /> + <edge from-layer="879" from-port="1" to-layer="881" to-port="0" /> + <edge from-layer="880" from-port="0" to-layer="881" to-port="1" /> + <edge from-layer="881" from-port="2" to-layer="885" to-port="1" /> + <edge from-layer="881" from-port="2" to-layer="891" to-port="2" /> + <edge from-layer="882" from-port="0" to-layer="885" to-port="2" /> + <edge from-layer="883" from-port="0" to-layer="885" to-port="3" /> + <edge from-layer="884" from-port="0" to-layer="885" to-port="4" /> + <edge from-layer="885" from-port="5" to-layer="887" to-port="0" /> + <edge from-layer="886" from-port="0" to-layer="887" to-port="1" /> + <edge from-layer="887" from-port="2" to-layer="892" to-port="0" /> + <edge from-layer="888" from-port="0" to-layer="891" to-port="1" /> + <edge from-layer="889" from-port="0" to-layer="891" to-port="3" /> + <edge from-layer="890" from-port="0" to-layer="891" to-port="4" /> + <edge from-layer="891" from-port="5" to-layer="892" to-port="1" /> + <edge from-layer="892" from-port="2" to-layer="893" to-port="0" /> + <edge from-layer="893" from-port="2" to-layer="894" to-port="1" /> + <edge from-layer="894" from-port="2" to-layer="1011" to-port="0" /> + <edge from-layer="895" from-port="0" to-layer="900" to-port="0" /> + <edge from-layer="896" from-port="0" to-layer="899" to-port="1" /> + <edge from-layer="897" from-port="0" to-layer="899" to-port="2" /> + <edge from-layer="898" from-port="0" to-layer="899" to-port="3" /> + <edge from-layer="899" from-port="4" to-layer="900" to-port="1" /> + <edge from-layer="900" from-port="2" to-layer="901" to-port="0" /> + <edge from-layer="901" from-port="1" to-layer="903" to-port="0" /> + <edge from-layer="902" from-port="0" to-layer="903" to-port="2" /> + <edge from-layer="903" from-port="3" to-layer="999" to-port="0" /> + <edge from-layer="903" from-port="3" to-layer="943" to-port="0" /> + <edge from-layer="904" from-port="0" to-layer="905" to-port="0" /> + <edge from-layer="905" from-port="1" to-layer="908" to-port="0" /> + <edge from-layer="906" from-port="0" to-layer="907" to-port="0" /> + <edge from-layer="907" from-port="1" to-layer="908" to-port="1" /> + <edge from-layer="908" from-port="2" to-layer="910" to-port="0" /> + <edge from-layer="909" from-port="0" to-layer="910" to-port="1" /> + <edge from-layer="910" from-port="2" to-layer="912" to-port="0" /> + <edge from-layer="911" from-port="0" to-layer="912" to-port="1" /> + <edge from-layer="912" from-port="2" to-layer="913" to-port="0" /> + <edge from-layer="913" from-port="1" to-layer="914" to-port="1" /> + <edge from-layer="914" from-port="2" to-layer="917" to-port="0" /> + <edge from-layer="915" from-port="0" to-layer="916" to-port="0" /> + <edge from-layer="916" from-port="1" to-layer="917" to-port="1" /> + <edge from-layer="917" from-port="2" to-layer="919" to-port="0" /> + <edge from-layer="918" from-port="0" to-layer="919" to-port="1" /> + <edge from-layer="919" from-port="2" to-layer="921" to-port="0" /> + <edge from-layer="920" from-port="0" to-layer="921" to-port="1" /> + <edge from-layer="921" from-port="2" to-layer="922" to-port="0" /> + <edge from-layer="921" from-port="2" to-layer="933" to-port="0" /> + <edge from-layer="921" from-port="2" to-layer="939" to-port="0" /> + <edge from-layer="921" from-port="2" to-layer="923" to-port="0" /> + <edge from-layer="922" from-port="2" to-layer="942" to-port="0" /> + <edge from-layer="923" from-port="1" to-layer="925" to-port="0" /> + <edge from-layer="924" from-port="0" to-layer="925" to-port="2" /> + <edge from-layer="925" from-port="3" to-layer="926" to-port="0" /> + <edge from-layer="926" from-port="2" to-layer="927" to-port="0" /> + <edge from-layer="927" from-port="1" to-layer="929" to-port="0" /> + <edge from-layer="928" from-port="0" to-layer="929" to-port="1" /> + <edge from-layer="929" from-port="2" to-layer="933" to-port="1" /> + <edge from-layer="929" from-port="2" to-layer="939" to-port="2" /> + <edge from-layer="930" from-port="0" to-layer="933" to-port="2" /> + <edge from-layer="931" from-port="0" to-layer="933" to-port="3" /> + <edge from-layer="932" from-port="0" to-layer="933" to-port="4" /> + <edge from-layer="933" from-port="5" to-layer="935" to-port="0" /> + <edge from-layer="934" from-port="0" to-layer="935" to-port="1" /> + <edge from-layer="935" from-port="2" to-layer="940" to-port="0" /> + <edge from-layer="936" from-port="0" to-layer="939" to-port="1" /> + <edge from-layer="937" from-port="0" to-layer="939" to-port="3" /> + <edge from-layer="938" from-port="0" to-layer="939" to-port="4" /> + <edge from-layer="939" from-port="5" to-layer="940" to-port="1" /> + <edge from-layer="940" from-port="2" to-layer="941" to-port="0" /> + <edge from-layer="941" from-port="2" to-layer="942" to-port="1" /> + <edge from-layer="942" from-port="2" to-layer="943" to-port="1" /> + <edge from-layer="942" from-port="2" to-layer="1003" to-port="0" /> + <edge from-layer="943" from-port="2" to-layer="944" to-port="0" /> + <edge from-layer="943" from-port="2" to-layer="945" to-port="0" /> + <edge from-layer="943" from-port="2" to-layer="11180" to-port="0" /> + <edge from-layer="944" from-port="2" to-layer="954" to-port="0" /> + <edge from-layer="945" from-port="1" to-layer="948" to-port="0" /> + <edge from-layer="945" from-port="1" to-layer="952" to-port="0" /> + <edge from-layer="946" from-port="0" to-layer="948" to-port="1" /> + <edge from-layer="947" from-port="0" to-layer="948" to-port="2" /> + <edge from-layer="948" from-port="3" to-layer="953" to-port="0" /> + <edge from-layer="949" from-port="0" to-layer="953" to-port="1" /> + <edge from-layer="950" from-port="0" to-layer="952" to-port="1" /> + <edge from-layer="951" from-port="0" to-layer="952" to-port="2" /> + <edge from-layer="952" from-port="3" to-layer="953" to-port="2" /> + <edge from-layer="953" from-port="3" to-layer="954" to-port="1" /> + <edge from-layer="954" from-port="2" to-layer="956" to-port="0" /> + <edge from-layer="955" from-port="0" to-layer="956" to-port="1" /> + <edge from-layer="956" from-port="2" to-layer="1011" to-port="1" /> + <edge from-layer="957" from-port="0" to-layer="962" to-port="0" /> + <edge from-layer="958" from-port="0" to-layer="961" to-port="1" /> + <edge from-layer="959" from-port="0" to-layer="961" to-port="2" /> + <edge from-layer="960" from-port="0" to-layer="961" to-port="3" /> + <edge from-layer="961" from-port="4" to-layer="962" to-port="1" /> + <edge from-layer="962" from-port="2" to-layer="963" to-port="0" /> + <edge from-layer="963" from-port="1" to-layer="965" to-port="0" /> + <edge from-layer="964" from-port="0" to-layer="965" to-port="2" /> + <edge from-layer="965" from-port="3" to-layer="984" to-port="0" /> + <edge from-layer="966" from-port="0" to-layer="967" to-port="0" /> + <edge from-layer="967" from-port="1" to-layer="970" to-port="0" /> + <edge from-layer="968" from-port="0" to-layer="969" to-port="0" /> + <edge from-layer="969" from-port="1" to-layer="970" to-port="1" /> + <edge from-layer="970" from-port="2" to-layer="972" to-port="0" /> + <edge from-layer="971" from-port="0" to-layer="972" to-port="1" /> + <edge from-layer="972" from-port="2" to-layer="974" to-port="0" /> + <edge from-layer="973" from-port="0" to-layer="974" to-port="1" /> + <edge from-layer="974" from-port="2" to-layer="975" to-port="0" /> + <edge from-layer="975" from-port="1" to-layer="976" to-port="1" /> + <edge from-layer="976" from-port="2" to-layer="979" to-port="0" /> + <edge from-layer="977" from-port="0" to-layer="978" to-port="0" /> + <edge from-layer="978" from-port="1" to-layer="979" to-port="1" /> + <edge from-layer="979" from-port="2" to-layer="981" to-port="0" /> + <edge from-layer="980" from-port="0" to-layer="981" to-port="1" /> + <edge from-layer="981" from-port="2" to-layer="983" to-port="0" /> + <edge from-layer="982" from-port="0" to-layer="983" to-port="1" /> + <edge from-layer="983" from-port="2" to-layer="984" to-port="1" /> + <edge from-layer="984" from-port="2" to-layer="985" to-port="0" /> + <edge from-layer="984" from-port="2" to-layer="986" to-port="0" /> + <edge from-layer="984" from-port="2" to-layer="11179" to-port="0" /> + <edge from-layer="985" from-port="2" to-layer="995" to-port="0" /> + <edge from-layer="986" from-port="1" to-layer="989" to-port="0" /> + <edge from-layer="986" from-port="1" to-layer="993" to-port="0" /> + <edge from-layer="987" from-port="0" to-layer="989" to-port="1" /> + <edge from-layer="988" from-port="0" to-layer="989" to-port="2" /> + <edge from-layer="989" from-port="3" to-layer="994" to-port="1" /> + <edge from-layer="990" from-port="0" to-layer="994" to-port="2" /> + <edge from-layer="991" from-port="0" to-layer="993" to-port="1" /> + <edge from-layer="992" from-port="0" to-layer="993" to-port="2" /> + <edge from-layer="993" from-port="3" to-layer="994" to-port="3" /> + <edge from-layer="994" from-port="4" to-layer="995" to-port="1" /> + <edge from-layer="995" from-port="2" to-layer="997" to-port="0" /> + <edge from-layer="996" from-port="0" to-layer="997" to-port="1" /> + <edge from-layer="997" from-port="2" to-layer="1011" to-port="2" /> + <edge from-layer="998" from-port="0" to-layer="1010" to-port="1" /> + <edge from-layer="999" from-port="1" to-layer="1002" to-port="0" /> + <edge from-layer="1000" from-port="0" to-layer="1002" to-port="1" /> + <edge from-layer="1001" from-port="0" to-layer="1002" to-port="2" /> + <edge from-layer="1002" from-port="3" to-layer="1007" to-port="0" /> + <edge from-layer="1003" from-port="1" to-layer="1006" to-port="0" /> + <edge from-layer="1004" from-port="0" to-layer="1006" to-port="1" /> + <edge from-layer="1005" from-port="0" to-layer="1006" to-port="2" /> + <edge from-layer="1006" from-port="3" to-layer="1007" to-port="1" /> + <edge from-layer="1007" from-port="2" to-layer="1010" to-port="2" /> + <edge from-layer="1008" from-port="0" to-layer="1010" to-port="3" /> + <edge from-layer="1009" from-port="0" to-layer="1010" to-port="4" /> + <edge from-layer="1010" from-port="5" to-layer="1011" to-port="3" /> + <edge from-layer="1011" from-port="4" to-layer="1013" to-port="0" /> + <edge from-layer="1012" from-port="0" to-layer="1013" to-port="1" /> + <edge from-layer="1013" from-port="2" to-layer="1015" to-port="0" /> + <edge from-layer="1014" from-port="0" to-layer="1015" to-port="1" /> + <edge from-layer="1015" from-port="2" to-layer="1026" to-port="0" /> + <edge from-layer="1016" from-port="0" to-layer="1017" to-port="0" /> + <edge from-layer="1017" from-port="1" to-layer="1020" to-port="0" /> + <edge from-layer="1018" from-port="0" to-layer="1019" to-port="0" /> + <edge from-layer="1019" from-port="1" to-layer="1020" to-port="1" /> + <edge from-layer="1020" from-port="2" to-layer="1022" to-port="0" /> + <edge from-layer="1021" from-port="0" to-layer="1022" to-port="1" /> + <edge from-layer="1022" from-port="2" to-layer="1024" to-port="0" /> + <edge from-layer="1023" from-port="0" to-layer="1024" to-port="1" /> + <edge from-layer="1024" from-port="2" to-layer="1025" to-port="0" /> + <edge from-layer="1025" from-port="1" to-layer="1026" to-port="1" /> + <edge from-layer="1026" from-port="2" to-layer="1027" to-port="1" /> + <edge from-layer="1027" from-port="2" to-layer="1031" to-port="0" /> + <edge from-layer="1027" from-port="2" to-layer="1075" to-port="0" /> + <edge from-layer="1027" from-port="2" to-layer="1038" to-port="0" /> + <edge from-layer="1028" from-port="0" to-layer="1039" to-port="0" /> + <edge from-layer="1029" from-port="0" to-layer="1037" to-port="0" /> + <edge from-layer="1030" from-port="0" to-layer="1031" to-port="1" /> + <edge from-layer="1031" from-port="2" to-layer="1033" to-port="0" /> + <edge from-layer="1032" from-port="0" to-layer="1033" to-port="1" /> + <edge from-layer="1033" from-port="2" to-layer="1035" to-port="0" /> + <edge from-layer="1034" from-port="0" to-layer="1035" to-port="1" /> + <edge from-layer="1035" from-port="2" to-layer="1036" to-port="0" /> + <edge from-layer="1036" from-port="1" to-layer="1037" to-port="1" /> + <edge from-layer="1037" from-port="2" to-layer="1038" to-port="1" /> + <edge from-layer="1038" from-port="2" to-layer="1039" to-port="1" /> + <edge from-layer="1039" from-port="2" to-layer="1050" to-port="0" /> + <edge from-layer="1039" from-port="2" to-layer="1062" to-port="0" /> + <edge from-layer="1040" from-port="0" to-layer="1041" to-port="0" /> + <edge from-layer="1041" from-port="1" to-layer="1044" to-port="0" /> + <edge from-layer="1042" from-port="0" to-layer="1043" to-port="0" /> + <edge from-layer="1043" from-port="1" to-layer="1044" to-port="1" /> + <edge from-layer="1044" from-port="2" to-layer="1046" to-port="0" /> + <edge from-layer="1045" from-port="0" to-layer="1046" to-port="1" /> + <edge from-layer="1046" from-port="2" to-layer="1048" to-port="0" /> + <edge from-layer="1047" from-port="0" to-layer="1048" to-port="1" /> + <edge from-layer="1048" from-port="2" to-layer="1049" to-port="0" /> + <edge from-layer="1049" from-port="1" to-layer="1050" to-port="1" /> + <edge from-layer="1050" from-port="2" to-layer="1051" to-port="0" /> + <edge from-layer="1051" from-port="1" to-layer="1063" to-port="0" /> + <edge from-layer="1052" from-port="0" to-layer="1053" to-port="0" /> + <edge from-layer="1053" from-port="1" to-layer="1056" to-port="0" /> + <edge from-layer="1054" from-port="0" to-layer="1055" to-port="0" /> + <edge from-layer="1055" from-port="1" to-layer="1056" to-port="1" /> + <edge from-layer="1056" from-port="2" to-layer="1058" to-port="0" /> + <edge from-layer="1057" from-port="0" to-layer="1058" to-port="1" /> + <edge from-layer="1058" from-port="2" to-layer="1060" to-port="0" /> + <edge from-layer="1059" from-port="0" to-layer="1060" to-port="1" /> + <edge from-layer="1060" from-port="2" to-layer="1061" to-port="0" /> + <edge from-layer="1061" from-port="1" to-layer="1062" to-port="1" /> + <edge from-layer="1062" from-port="2" to-layer="1063" to-port="1" /> + <edge from-layer="1063" from-port="2" to-layer="1074" to-port="0" /> + <edge from-layer="1064" from-port="0" to-layer="1065" to-port="0" /> + <edge from-layer="1065" from-port="1" to-layer="1068" to-port="0" /> + <edge from-layer="1066" from-port="0" to-layer="1067" to-port="0" /> + <edge from-layer="1067" from-port="1" to-layer="1068" to-port="1" /> + <edge from-layer="1068" from-port="2" to-layer="1070" to-port="0" /> + <edge from-layer="1069" from-port="0" to-layer="1070" to-port="1" /> + <edge from-layer="1070" from-port="2" to-layer="1072" to-port="0" /> + <edge from-layer="1071" from-port="0" to-layer="1072" to-port="1" /> + <edge from-layer="1072" from-port="2" to-layer="1073" to-port="0" /> + <edge from-layer="1073" from-port="1" to-layer="1074" to-port="1" /> + <edge from-layer="1074" from-port="2" to-layer="1075" to-port="1" /> + <edge from-layer="1075" from-port="2" to-layer="1079" to-port="0" /> + <edge from-layer="1075" from-port="2" to-layer="1086" to-port="0" /> + <edge from-layer="1075" from-port="2" to-layer="1259" to-port="0" /> + <edge from-layer="1076" from-port="0" to-layer="1087" to-port="0" /> + <edge from-layer="1077" from-port="0" to-layer="1085" to-port="0" /> + <edge from-layer="1078" from-port="0" to-layer="1079" to-port="1" /> + <edge from-layer="1079" from-port="2" to-layer="1081" to-port="0" /> + <edge from-layer="1080" from-port="0" to-layer="1081" to-port="1" /> + <edge from-layer="1081" from-port="2" to-layer="1083" to-port="0" /> + <edge from-layer="1082" from-port="0" to-layer="1083" to-port="1" /> + <edge from-layer="1083" from-port="2" to-layer="1084" to-port="0" /> + <edge from-layer="1084" from-port="1" to-layer="1085" to-port="1" /> + <edge from-layer="1085" from-port="2" to-layer="1086" to-port="1" /> + <edge from-layer="1086" from-port="2" to-layer="1087" to-port="1" /> + <edge from-layer="1087" from-port="2" to-layer="1146" to-port="0" /> + <edge from-layer="1087" from-port="2" to-layer="1208" to-port="0" /> + <edge from-layer="1087" from-port="2" to-layer="1098" to-port="0" /> + <edge from-layer="1088" from-port="0" to-layer="1089" to-port="0" /> + <edge from-layer="1089" from-port="1" to-layer="1092" to-port="0" /> + <edge from-layer="1090" from-port="0" to-layer="1091" to-port="0" /> + <edge from-layer="1091" from-port="1" to-layer="1092" to-port="1" /> + <edge from-layer="1092" from-port="2" to-layer="1094" to-port="0" /> + <edge from-layer="1093" from-port="0" to-layer="1094" to-port="1" /> + <edge from-layer="1094" from-port="2" to-layer="1096" to-port="0" /> + <edge from-layer="1095" from-port="0" to-layer="1096" to-port="1" /> + <edge from-layer="1096" from-port="2" to-layer="1097" to-port="0" /> + <edge from-layer="1097" from-port="1" to-layer="1098" to-port="1" /> + <edge from-layer="1098" from-port="2" to-layer="1101" to-port="0" /> + <edge from-layer="1099" from-port="0" to-layer="1100" to-port="0" /> + <edge from-layer="1100" from-port="1" to-layer="1101" to-port="1" /> + <edge from-layer="1101" from-port="2" to-layer="1103" to-port="0" /> + <edge from-layer="1102" from-port="0" to-layer="1103" to-port="1" /> + <edge from-layer="1103" from-port="2" to-layer="1105" to-port="0" /> + <edge from-layer="1104" from-port="0" to-layer="1105" to-port="1" /> + <edge from-layer="1105" from-port="2" to-layer="1123" to-port="0" /> + <edge from-layer="1105" from-port="2" to-layer="1117" to-port="0" /> + <edge from-layer="1105" from-port="2" to-layer="1107" to-port="0" /> + <edge from-layer="1105" from-port="2" to-layer="1106" to-port="0" /> + <edge from-layer="1106" from-port="2" to-layer="1126" to-port="0" /> + <edge from-layer="1107" from-port="1" to-layer="1109" to-port="0" /> + <edge from-layer="1108" from-port="0" to-layer="1109" to-port="2" /> + <edge from-layer="1109" from-port="3" to-layer="1110" to-port="0" /> + <edge from-layer="1110" from-port="2" to-layer="1111" to-port="0" /> + <edge from-layer="1111" from-port="1" to-layer="1113" to-port="0" /> + <edge from-layer="1112" from-port="0" to-layer="1113" to-port="1" /> + <edge from-layer="1113" from-port="2" to-layer="1117" to-port="1" /> + <edge from-layer="1113" from-port="2" to-layer="1123" to-port="2" /> + <edge from-layer="1114" from-port="0" to-layer="1117" to-port="2" /> + <edge from-layer="1115" from-port="0" to-layer="1117" to-port="3" /> + <edge from-layer="1116" from-port="0" to-layer="1117" to-port="4" /> + <edge from-layer="1117" from-port="5" to-layer="1119" to-port="0" /> + <edge from-layer="1118" from-port="0" to-layer="1119" to-port="1" /> + <edge from-layer="1119" from-port="2" to-layer="1124" to-port="0" /> + <edge from-layer="1120" from-port="0" to-layer="1123" to-port="1" /> + <edge from-layer="1121" from-port="0" to-layer="1123" to-port="3" /> + <edge from-layer="1122" from-port="0" to-layer="1123" to-port="4" /> + <edge from-layer="1123" from-port="5" to-layer="1124" to-port="1" /> + <edge from-layer="1124" from-port="2" to-layer="1125" to-port="0" /> + <edge from-layer="1125" from-port="2" to-layer="1126" to-port="1" /> + <edge from-layer="1126" from-port="2" to-layer="1243" to-port="0" /> + <edge from-layer="1127" from-port="0" to-layer="1132" to-port="0" /> + <edge from-layer="1128" from-port="0" to-layer="1131" to-port="1" /> + <edge from-layer="1129" from-port="0" to-layer="1131" to-port="2" /> + <edge from-layer="1130" from-port="0" to-layer="1131" to-port="3" /> + <edge from-layer="1131" from-port="4" to-layer="1132" to-port="1" /> + <edge from-layer="1132" from-port="2" to-layer="1133" to-port="0" /> + <edge from-layer="1133" from-port="1" to-layer="1135" to-port="0" /> + <edge from-layer="1134" from-port="0" to-layer="1135" to-port="2" /> + <edge from-layer="1135" from-port="3" to-layer="1231" to-port="0" /> + <edge from-layer="1135" from-port="3" to-layer="1175" to-port="0" /> + <edge from-layer="1136" from-port="0" to-layer="1137" to-port="0" /> + <edge from-layer="1137" from-port="1" to-layer="1140" to-port="0" /> + <edge from-layer="1138" from-port="0" to-layer="1139" to-port="0" /> + <edge from-layer="1139" from-port="1" to-layer="1140" to-port="1" /> + <edge from-layer="1140" from-port="2" to-layer="1142" to-port="0" /> + <edge from-layer="1141" from-port="0" to-layer="1142" to-port="1" /> + <edge from-layer="1142" from-port="2" to-layer="1144" to-port="0" /> + <edge from-layer="1143" from-port="0" to-layer="1144" to-port="1" /> + <edge from-layer="1144" from-port="2" to-layer="1145" to-port="0" /> + <edge from-layer="1145" from-port="1" to-layer="1146" to-port="1" /> + <edge from-layer="1146" from-port="2" to-layer="1149" to-port="0" /> + <edge from-layer="1147" from-port="0" to-layer="1148" to-port="0" /> + <edge from-layer="1148" from-port="1" to-layer="1149" to-port="1" /> + <edge from-layer="1149" from-port="2" to-layer="1151" to-port="0" /> + <edge from-layer="1150" from-port="0" to-layer="1151" to-port="1" /> + <edge from-layer="1151" from-port="2" to-layer="1153" to-port="0" /> + <edge from-layer="1152" from-port="0" to-layer="1153" to-port="1" /> + <edge from-layer="1153" from-port="2" to-layer="1154" to-port="0" /> + <edge from-layer="1153" from-port="2" to-layer="1171" to-port="0" /> + <edge from-layer="1153" from-port="2" to-layer="1155" to-port="0" /> + <edge from-layer="1153" from-port="2" to-layer="1165" to-port="0" /> + <edge from-layer="1154" from-port="2" to-layer="1174" to-port="0" /> + <edge from-layer="1155" from-port="1" to-layer="1157" to-port="0" /> + <edge from-layer="1156" from-port="0" to-layer="1157" to-port="2" /> + <edge from-layer="1157" from-port="3" to-layer="1158" to-port="0" /> + <edge from-layer="1158" from-port="2" to-layer="1159" to-port="0" /> + <edge from-layer="1159" from-port="1" to-layer="1161" to-port="0" /> + <edge from-layer="1160" from-port="0" to-layer="1161" to-port="1" /> + <edge from-layer="1161" from-port="2" to-layer="1165" to-port="1" /> + <edge from-layer="1161" from-port="2" to-layer="1171" to-port="2" /> + <edge from-layer="1162" from-port="0" to-layer="1165" to-port="2" /> + <edge from-layer="1163" from-port="0" to-layer="1165" to-port="3" /> + <edge from-layer="1164" from-port="0" to-layer="1165" to-port="4" /> + <edge from-layer="1165" from-port="5" to-layer="1167" to-port="0" /> + <edge from-layer="1166" from-port="0" to-layer="1167" to-port="1" /> + <edge from-layer="1167" from-port="2" to-layer="1172" to-port="0" /> + <edge from-layer="1168" from-port="0" to-layer="1171" to-port="1" /> + <edge from-layer="1169" from-port="0" to-layer="1171" to-port="3" /> + <edge from-layer="1170" from-port="0" to-layer="1171" to-port="4" /> + <edge from-layer="1171" from-port="5" to-layer="1172" to-port="1" /> + <edge from-layer="1172" from-port="2" to-layer="1173" to-port="0" /> + <edge from-layer="1173" from-port="2" to-layer="1174" to-port="1" /> + <edge from-layer="1174" from-port="2" to-layer="1235" to-port="0" /> + <edge from-layer="1174" from-port="2" to-layer="1175" to-port="1" /> + <edge from-layer="1175" from-port="2" to-layer="11158" to-port="0" /> + <edge from-layer="1175" from-port="2" to-layer="1177" to-port="0" /> + <edge from-layer="1175" from-port="2" to-layer="1176" to-port="0" /> + <edge from-layer="1176" from-port="2" to-layer="1186" to-port="0" /> + <edge from-layer="1177" from-port="1" to-layer="1184" to-port="0" /> + <edge from-layer="1177" from-port="1" to-layer="1180" to-port="0" /> + <edge from-layer="1178" from-port="0" to-layer="1180" to-port="1" /> + <edge from-layer="1179" from-port="0" to-layer="1180" to-port="2" /> + <edge from-layer="1180" from-port="3" to-layer="1185" to-port="0" /> + <edge from-layer="1181" from-port="0" to-layer="1185" to-port="1" /> + <edge from-layer="1182" from-port="0" to-layer="1184" to-port="1" /> + <edge from-layer="1183" from-port="0" to-layer="1184" to-port="2" /> + <edge from-layer="1184" from-port="3" to-layer="1185" to-port="2" /> + <edge from-layer="1185" from-port="3" to-layer="1186" to-port="1" /> + <edge from-layer="1186" from-port="2" to-layer="1188" to-port="0" /> + <edge from-layer="1187" from-port="0" to-layer="1188" to-port="1" /> + <edge from-layer="1188" from-port="2" to-layer="1243" to-port="1" /> + <edge from-layer="1189" from-port="0" to-layer="1194" to-port="0" /> + <edge from-layer="1190" from-port="0" to-layer="1193" to-port="1" /> + <edge from-layer="1191" from-port="0" to-layer="1193" to-port="2" /> + <edge from-layer="1192" from-port="0" to-layer="1193" to-port="3" /> + <edge from-layer="1193" from-port="4" to-layer="1194" to-port="1" /> + <edge from-layer="1194" from-port="2" to-layer="1195" to-port="0" /> + <edge from-layer="1195" from-port="1" to-layer="1197" to-port="0" /> + <edge from-layer="1196" from-port="0" to-layer="1197" to-port="2" /> + <edge from-layer="1197" from-port="3" to-layer="1216" to-port="0" /> + <edge from-layer="1198" from-port="0" to-layer="1199" to-port="0" /> + <edge from-layer="1199" from-port="1" to-layer="1202" to-port="0" /> + <edge from-layer="1200" from-port="0" to-layer="1201" to-port="0" /> + <edge from-layer="1201" from-port="1" to-layer="1202" to-port="1" /> + <edge from-layer="1202" from-port="2" to-layer="1204" to-port="0" /> + <edge from-layer="1203" from-port="0" to-layer="1204" to-port="1" /> + <edge from-layer="1204" from-port="2" to-layer="1206" to-port="0" /> + <edge from-layer="1205" from-port="0" to-layer="1206" to-port="1" /> + <edge from-layer="1206" from-port="2" to-layer="1207" to-port="0" /> + <edge from-layer="1207" from-port="1" to-layer="1208" to-port="1" /> + <edge from-layer="1208" from-port="2" to-layer="1211" to-port="0" /> + <edge from-layer="1209" from-port="0" to-layer="1210" to-port="0" /> + <edge from-layer="1210" from-port="1" to-layer="1211" to-port="1" /> + <edge from-layer="1211" from-port="2" to-layer="1213" to-port="0" /> + <edge from-layer="1212" from-port="0" to-layer="1213" to-port="1" /> + <edge from-layer="1213" from-port="2" to-layer="1215" to-port="0" /> + <edge from-layer="1214" from-port="0" to-layer="1215" to-port="1" /> + <edge from-layer="1215" from-port="2" to-layer="1216" to-port="1" /> + <edge from-layer="1216" from-port="2" to-layer="1218" to-port="0" /> + <edge from-layer="1216" from-port="2" to-layer="1217" to-port="0" /> + <edge from-layer="1216" from-port="2" to-layer="11157" to-port="0" /> + <edge from-layer="1217" from-port="2" to-layer="1227" to-port="0" /> + <edge from-layer="1218" from-port="1" to-layer="1221" to-port="0" /> + <edge from-layer="1218" from-port="1" to-layer="1225" to-port="0" /> + <edge from-layer="1219" from-port="0" to-layer="1221" to-port="1" /> + <edge from-layer="1220" from-port="0" to-layer="1221" to-port="2" /> + <edge from-layer="1221" from-port="3" to-layer="1226" to-port="1" /> + <edge from-layer="1222" from-port="0" to-layer="1226" to-port="2" /> + <edge from-layer="1223" from-port="0" to-layer="1225" to-port="1" /> + <edge from-layer="1224" from-port="0" to-layer="1225" to-port="2" /> + <edge from-layer="1225" from-port="3" to-layer="1226" to-port="3" /> + <edge from-layer="1226" from-port="4" to-layer="1227" to-port="1" /> + <edge from-layer="1227" from-port="2" to-layer="1229" to-port="0" /> + <edge from-layer="1228" from-port="0" to-layer="1229" to-port="1" /> + <edge from-layer="1229" from-port="2" to-layer="1243" to-port="2" /> + <edge from-layer="1230" from-port="0" to-layer="1242" to-port="1" /> + <edge from-layer="1231" from-port="1" to-layer="1234" to-port="0" /> + <edge from-layer="1232" from-port="0" to-layer="1234" to-port="1" /> + <edge from-layer="1233" from-port="0" to-layer="1234" to-port="2" /> + <edge from-layer="1234" from-port="3" to-layer="1239" to-port="0" /> + <edge from-layer="1235" from-port="1" to-layer="1238" to-port="0" /> + <edge from-layer="1236" from-port="0" to-layer="1238" to-port="1" /> + <edge from-layer="1237" from-port="0" to-layer="1238" to-port="2" /> + <edge from-layer="1238" from-port="3" to-layer="1239" to-port="1" /> + <edge from-layer="1239" from-port="2" to-layer="1242" to-port="2" /> + <edge from-layer="1240" from-port="0" to-layer="1242" to-port="3" /> + <edge from-layer="1241" from-port="0" to-layer="1242" to-port="4" /> + <edge from-layer="1242" from-port="5" to-layer="1243" to-port="3" /> + <edge from-layer="1243" from-port="4" to-layer="1245" to-port="0" /> + <edge from-layer="1244" from-port="0" to-layer="1245" to-port="1" /> + <edge from-layer="1245" from-port="2" to-layer="1247" to-port="0" /> + <edge from-layer="1246" from-port="0" to-layer="1247" to-port="1" /> + <edge from-layer="1247" from-port="2" to-layer="1258" to-port="0" /> + <edge from-layer="1248" from-port="0" to-layer="1249" to-port="0" /> + <edge from-layer="1249" from-port="1" to-layer="1252" to-port="0" /> + <edge from-layer="1250" from-port="0" to-layer="1251" to-port="0" /> + <edge from-layer="1251" from-port="1" to-layer="1252" to-port="1" /> + <edge from-layer="1252" from-port="2" to-layer="1254" to-port="0" /> + <edge from-layer="1253" from-port="0" to-layer="1254" to-port="1" /> + <edge from-layer="1254" from-port="2" to-layer="1256" to-port="0" /> + <edge from-layer="1255" from-port="0" to-layer="1256" to-port="1" /> + <edge from-layer="1256" from-port="2" to-layer="1257" to-port="0" /> + <edge from-layer="1257" from-port="1" to-layer="1258" to-port="1" /> + <edge from-layer="1258" from-port="2" to-layer="1259" to-port="1" /> + <edge from-layer="1259" from-port="2" to-layer="1270" to-port="0" /> + <edge from-layer="1259" from-port="2" to-layer="1263" to-port="0" /> + <edge from-layer="1259" from-port="2" to-layer="1307" to-port="0" /> + <edge from-layer="1260" from-port="0" to-layer="1271" to-port="0" /> + <edge from-layer="1261" from-port="0" to-layer="1269" to-port="0" /> + <edge from-layer="1262" from-port="0" to-layer="1263" to-port="1" /> + <edge from-layer="1263" from-port="2" to-layer="1265" to-port="0" /> + <edge from-layer="1264" from-port="0" to-layer="1265" to-port="1" /> + <edge from-layer="1265" from-port="2" to-layer="1267" to-port="0" /> + <edge from-layer="1266" from-port="0" to-layer="1267" to-port="1" /> + <edge from-layer="1267" from-port="2" to-layer="1268" to-port="0" /> + <edge from-layer="1268" from-port="1" to-layer="1269" to-port="1" /> + <edge from-layer="1269" from-port="2" to-layer="1270" to-port="1" /> + <edge from-layer="1270" from-port="2" to-layer="1271" to-port="1" /> + <edge from-layer="1271" from-port="2" to-layer="1294" to-port="0" /> + <edge from-layer="1271" from-port="2" to-layer="1282" to-port="0" /> + <edge from-layer="1272" from-port="0" to-layer="1273" to-port="0" /> + <edge from-layer="1273" from-port="1" to-layer="1276" to-port="0" /> + <edge from-layer="1274" from-port="0" to-layer="1275" to-port="0" /> + <edge from-layer="1275" from-port="1" to-layer="1276" to-port="1" /> + <edge from-layer="1276" from-port="2" to-layer="1278" to-port="0" /> + <edge from-layer="1277" from-port="0" to-layer="1278" to-port="1" /> + <edge from-layer="1278" from-port="2" to-layer="1280" to-port="0" /> + <edge from-layer="1279" from-port="0" to-layer="1280" to-port="1" /> + <edge from-layer="1280" from-port="2" to-layer="1281" to-port="0" /> + <edge from-layer="1281" from-port="1" to-layer="1282" to-port="1" /> + <edge from-layer="1282" from-port="2" to-layer="1283" to-port="0" /> + <edge from-layer="1283" from-port="1" to-layer="1295" to-port="0" /> + <edge from-layer="1284" from-port="0" to-layer="1285" to-port="0" /> + <edge from-layer="1285" from-port="1" to-layer="1288" to-port="0" /> + <edge from-layer="1286" from-port="0" to-layer="1287" to-port="0" /> + <edge from-layer="1287" from-port="1" to-layer="1288" to-port="1" /> + <edge from-layer="1288" from-port="2" to-layer="1290" to-port="0" /> + <edge from-layer="1289" from-port="0" to-layer="1290" to-port="1" /> + <edge from-layer="1290" from-port="2" to-layer="1292" to-port="0" /> + <edge from-layer="1291" from-port="0" to-layer="1292" to-port="1" /> + <edge from-layer="1292" from-port="2" to-layer="1293" to-port="0" /> + <edge from-layer="1293" from-port="1" to-layer="1294" to-port="1" /> + <edge from-layer="1294" from-port="2" to-layer="1295" to-port="1" /> + <edge from-layer="1295" from-port="2" to-layer="1306" to-port="0" /> + <edge from-layer="1296" from-port="0" to-layer="1297" to-port="0" /> + <edge from-layer="1297" from-port="1" to-layer="1300" to-port="0" /> + <edge from-layer="1298" from-port="0" to-layer="1299" to-port="0" /> + <edge from-layer="1299" from-port="1" to-layer="1300" to-port="1" /> + <edge from-layer="1300" from-port="2" to-layer="1302" to-port="0" /> + <edge from-layer="1301" from-port="0" to-layer="1302" to-port="1" /> + <edge from-layer="1302" from-port="2" to-layer="1304" to-port="0" /> + <edge from-layer="1303" from-port="0" to-layer="1304" to-port="1" /> + <edge from-layer="1304" from-port="2" to-layer="1305" to-port="0" /> + <edge from-layer="1305" from-port="1" to-layer="1306" to-port="1" /> + <edge from-layer="1306" from-port="2" to-layer="1307" to-port="1" /> + <edge from-layer="1307" from-port="2" to-layer="1491" to-port="0" /> + <edge from-layer="1307" from-port="2" to-layer="1311" to-port="0" /> + <edge from-layer="1307" from-port="2" to-layer="1318" to-port="0" /> + <edge from-layer="1308" from-port="0" to-layer="1319" to-port="0" /> + <edge from-layer="1309" from-port="0" to-layer="1317" to-port="0" /> + <edge from-layer="1310" from-port="0" to-layer="1311" to-port="1" /> + <edge from-layer="1311" from-port="2" to-layer="1313" to-port="0" /> + <edge from-layer="1312" from-port="0" to-layer="1313" to-port="1" /> + <edge from-layer="1313" from-port="2" to-layer="1315" to-port="0" /> + <edge from-layer="1314" from-port="0" to-layer="1315" to-port="1" /> + <edge from-layer="1315" from-port="2" to-layer="1316" to-port="0" /> + <edge from-layer="1316" from-port="1" to-layer="1317" to-port="1" /> + <edge from-layer="1317" from-port="2" to-layer="1318" to-port="1" /> + <edge from-layer="1318" from-port="2" to-layer="1319" to-port="1" /> + <edge from-layer="1319" from-port="2" to-layer="1330" to-port="0" /> + <edge from-layer="1319" from-port="2" to-layer="1378" to-port="0" /> + <edge from-layer="1319" from-port="2" to-layer="1440" to-port="0" /> + <edge from-layer="1320" from-port="0" to-layer="1321" to-port="0" /> + <edge from-layer="1321" from-port="1" to-layer="1324" to-port="0" /> + <edge from-layer="1322" from-port="0" to-layer="1323" to-port="0" /> + <edge from-layer="1323" from-port="1" to-layer="1324" to-port="1" /> + <edge from-layer="1324" from-port="2" to-layer="1326" to-port="0" /> + <edge from-layer="1325" from-port="0" to-layer="1326" to-port="1" /> + <edge from-layer="1326" from-port="2" to-layer="1328" to-port="0" /> + <edge from-layer="1327" from-port="0" to-layer="1328" to-port="1" /> + <edge from-layer="1328" from-port="2" to-layer="1329" to-port="0" /> + <edge from-layer="1329" from-port="1" to-layer="1330" to-port="1" /> + <edge from-layer="1330" from-port="2" to-layer="1333" to-port="0" /> + <edge from-layer="1331" from-port="0" to-layer="1332" to-port="0" /> + <edge from-layer="1332" from-port="1" to-layer="1333" to-port="1" /> + <edge from-layer="1333" from-port="2" to-layer="1335" to-port="0" /> + <edge from-layer="1334" from-port="0" to-layer="1335" to-port="1" /> + <edge from-layer="1335" from-port="2" to-layer="1337" to-port="0" /> + <edge from-layer="1336" from-port="0" to-layer="1337" to-port="1" /> + <edge from-layer="1337" from-port="2" to-layer="1349" to-port="0" /> + <edge from-layer="1337" from-port="2" to-layer="1339" to-port="0" /> + <edge from-layer="1337" from-port="2" to-layer="1338" to-port="0" /> + <edge from-layer="1337" from-port="2" to-layer="1355" to-port="0" /> + <edge from-layer="1338" from-port="2" to-layer="1358" to-port="0" /> + <edge from-layer="1339" from-port="1" to-layer="1341" to-port="0" /> + <edge from-layer="1340" from-port="0" to-layer="1341" to-port="2" /> + <edge from-layer="1341" from-port="3" to-layer="1342" to-port="0" /> + <edge from-layer="1342" from-port="2" to-layer="1343" to-port="0" /> + <edge from-layer="1343" from-port="1" to-layer="1345" to-port="0" /> + <edge from-layer="1344" from-port="0" to-layer="1345" to-port="1" /> + <edge from-layer="1345" from-port="2" to-layer="1355" to-port="2" /> + <edge from-layer="1345" from-port="2" to-layer="1349" to-port="1" /> + <edge from-layer="1346" from-port="0" to-layer="1349" to-port="2" /> + <edge from-layer="1347" from-port="0" to-layer="1349" to-port="3" /> + <edge from-layer="1348" from-port="0" to-layer="1349" to-port="4" /> + <edge from-layer="1349" from-port="5" to-layer="1351" to-port="0" /> + <edge from-layer="1350" from-port="0" to-layer="1351" to-port="1" /> + <edge from-layer="1351" from-port="2" to-layer="1356" to-port="0" /> + <edge from-layer="1352" from-port="0" to-layer="1355" to-port="1" /> + <edge from-layer="1353" from-port="0" to-layer="1355" to-port="3" /> + <edge from-layer="1354" from-port="0" to-layer="1355" to-port="4" /> + <edge from-layer="1355" from-port="5" to-layer="1356" to-port="1" /> + <edge from-layer="1356" from-port="2" to-layer="1357" to-port="0" /> + <edge from-layer="1357" from-port="2" to-layer="1358" to-port="1" /> + <edge from-layer="1358" from-port="2" to-layer="1475" to-port="0" /> + <edge from-layer="1359" from-port="0" to-layer="1364" to-port="0" /> + <edge from-layer="1360" from-port="0" to-layer="1363" to-port="1" /> + <edge from-layer="1361" from-port="0" to-layer="1363" to-port="2" /> + <edge from-layer="1362" from-port="0" to-layer="1363" to-port="3" /> + <edge from-layer="1363" from-port="4" to-layer="1364" to-port="1" /> + <edge from-layer="1364" from-port="2" to-layer="1365" to-port="0" /> + <edge from-layer="1365" from-port="1" to-layer="1367" to-port="0" /> + <edge from-layer="1366" from-port="0" to-layer="1367" to-port="2" /> + <edge from-layer="1367" from-port="3" to-layer="1463" to-port="0" /> + <edge from-layer="1367" from-port="3" to-layer="1407" to-port="0" /> + <edge from-layer="1368" from-port="0" to-layer="1369" to-port="0" /> + <edge from-layer="1369" from-port="1" to-layer="1372" to-port="0" /> + <edge from-layer="1370" from-port="0" to-layer="1371" to-port="0" /> + <edge from-layer="1371" from-port="1" to-layer="1372" to-port="1" /> + <edge from-layer="1372" from-port="2" to-layer="1374" to-port="0" /> + <edge from-layer="1373" from-port="0" to-layer="1374" to-port="1" /> + <edge from-layer="1374" from-port="2" to-layer="1376" to-port="0" /> + <edge from-layer="1375" from-port="0" to-layer="1376" to-port="1" /> + <edge from-layer="1376" from-port="2" to-layer="1377" to-port="0" /> + <edge from-layer="1377" from-port="1" to-layer="1378" to-port="1" /> + <edge from-layer="1378" from-port="2" to-layer="1381" to-port="0" /> + <edge from-layer="1379" from-port="0" to-layer="1380" to-port="0" /> + <edge from-layer="1380" from-port="1" to-layer="1381" to-port="1" /> + <edge from-layer="1381" from-port="2" to-layer="1383" to-port="0" /> + <edge from-layer="1382" from-port="0" to-layer="1383" to-port="1" /> + <edge from-layer="1383" from-port="2" to-layer="1385" to-port="0" /> + <edge from-layer="1384" from-port="0" to-layer="1385" to-port="1" /> + <edge from-layer="1385" from-port="2" to-layer="1397" to-port="0" /> + <edge from-layer="1385" from-port="2" to-layer="1387" to-port="0" /> + <edge from-layer="1385" from-port="2" to-layer="1386" to-port="0" /> + <edge from-layer="1385" from-port="2" to-layer="1403" to-port="0" /> + <edge from-layer="1386" from-port="2" to-layer="1406" to-port="0" /> + <edge from-layer="1387" from-port="1" to-layer="1389" to-port="0" /> + <edge from-layer="1388" from-port="0" to-layer="1389" to-port="2" /> + <edge from-layer="1389" from-port="3" to-layer="1390" to-port="0" /> + <edge from-layer="1390" from-port="2" to-layer="1391" to-port="0" /> + <edge from-layer="1391" from-port="1" to-layer="1393" to-port="0" /> + <edge from-layer="1392" from-port="0" to-layer="1393" to-port="1" /> + <edge from-layer="1393" from-port="2" to-layer="1403" to-port="2" /> + <edge from-layer="1393" from-port="2" to-layer="1397" to-port="1" /> + <edge from-layer="1394" from-port="0" to-layer="1397" to-port="2" /> + <edge from-layer="1395" from-port="0" to-layer="1397" to-port="3" /> + <edge from-layer="1396" from-port="0" to-layer="1397" to-port="4" /> + <edge from-layer="1397" from-port="5" to-layer="1399" to-port="0" /> + <edge from-layer="1398" from-port="0" to-layer="1399" to-port="1" /> + <edge from-layer="1399" from-port="2" to-layer="1404" to-port="0" /> + <edge from-layer="1400" from-port="0" to-layer="1403" to-port="1" /> + <edge from-layer="1401" from-port="0" to-layer="1403" to-port="3" /> + <edge from-layer="1402" from-port="0" to-layer="1403" to-port="4" /> + <edge from-layer="1403" from-port="5" to-layer="1404" to-port="1" /> + <edge from-layer="1404" from-port="2" to-layer="1405" to-port="0" /> + <edge from-layer="1405" from-port="2" to-layer="1406" to-port="1" /> + <edge from-layer="1406" from-port="2" to-layer="1467" to-port="0" /> + <edge from-layer="1406" from-port="2" to-layer="1407" to-port="1" /> + <edge from-layer="1407" from-port="2" to-layer="2324" to-port="0" /> + <edge from-layer="1407" from-port="2" to-layer="1409" to-port="0" /> + <edge from-layer="1407" from-port="2" to-layer="1408" to-port="0" /> + <edge from-layer="1408" from-port="2" to-layer="1418" to-port="0" /> + <edge from-layer="1409" from-port="1" to-layer="1412" to-port="0" /> + <edge from-layer="1409" from-port="1" to-layer="1416" to-port="0" /> + <edge from-layer="1410" from-port="0" to-layer="1412" to-port="1" /> + <edge from-layer="1411" from-port="0" to-layer="1412" to-port="2" /> + <edge from-layer="1412" from-port="3" to-layer="1417" to-port="0" /> + <edge from-layer="1413" from-port="0" to-layer="1417" to-port="1" /> + <edge from-layer="1414" from-port="0" to-layer="1416" to-port="1" /> + <edge from-layer="1415" from-port="0" to-layer="1416" to-port="2" /> + <edge from-layer="1416" from-port="3" to-layer="1417" to-port="2" /> + <edge from-layer="1417" from-port="3" to-layer="1418" to-port="1" /> + <edge from-layer="1418" from-port="2" to-layer="1420" to-port="0" /> + <edge from-layer="1419" from-port="0" to-layer="1420" to-port="1" /> + <edge from-layer="1420" from-port="2" to-layer="1475" to-port="1" /> + <edge from-layer="1421" from-port="0" to-layer="1426" to-port="0" /> + <edge from-layer="1422" from-port="0" to-layer="1425" to-port="1" /> + <edge from-layer="1423" from-port="0" to-layer="1425" to-port="2" /> + <edge from-layer="1424" from-port="0" to-layer="1425" to-port="3" /> + <edge from-layer="1425" from-port="4" to-layer="1426" to-port="1" /> + <edge from-layer="1426" from-port="2" to-layer="1427" to-port="0" /> + <edge from-layer="1427" from-port="1" to-layer="1429" to-port="0" /> + <edge from-layer="1428" from-port="0" to-layer="1429" to-port="2" /> + <edge from-layer="1429" from-port="3" to-layer="1448" to-port="0" /> + <edge from-layer="1430" from-port="0" to-layer="1431" to-port="0" /> + <edge from-layer="1431" from-port="1" to-layer="1434" to-port="0" /> + <edge from-layer="1432" from-port="0" to-layer="1433" to-port="0" /> + <edge from-layer="1433" from-port="1" to-layer="1434" to-port="1" /> + <edge from-layer="1434" from-port="2" to-layer="1436" to-port="0" /> + <edge from-layer="1435" from-port="0" to-layer="1436" to-port="1" /> + <edge from-layer="1436" from-port="2" to-layer="1438" to-port="0" /> + <edge from-layer="1437" from-port="0" to-layer="1438" to-port="1" /> + <edge from-layer="1438" from-port="2" to-layer="1439" to-port="0" /> + <edge from-layer="1439" from-port="1" to-layer="1440" to-port="1" /> + <edge from-layer="1440" from-port="2" to-layer="1443" to-port="0" /> + <edge from-layer="1441" from-port="0" to-layer="1442" to-port="0" /> + <edge from-layer="1442" from-port="1" to-layer="1443" to-port="1" /> + <edge from-layer="1443" from-port="2" to-layer="1445" to-port="0" /> + <edge from-layer="1444" from-port="0" to-layer="1445" to-port="1" /> + <edge from-layer="1445" from-port="2" to-layer="1447" to-port="0" /> + <edge from-layer="1446" from-port="0" to-layer="1447" to-port="1" /> + <edge from-layer="1447" from-port="2" to-layer="1448" to-port="1" /> + <edge from-layer="1448" from-port="2" to-layer="2323" to-port="0" /> + <edge from-layer="1448" from-port="2" to-layer="1450" to-port="0" /> + <edge from-layer="1448" from-port="2" to-layer="1449" to-port="0" /> + <edge from-layer="1449" from-port="2" to-layer="1459" to-port="0" /> + <edge from-layer="1450" from-port="1" to-layer="1453" to-port="0" /> + <edge from-layer="1450" from-port="1" to-layer="1457" to-port="0" /> + <edge from-layer="1451" from-port="0" to-layer="1453" to-port="1" /> + <edge from-layer="1452" from-port="0" to-layer="1453" to-port="2" /> + <edge from-layer="1453" from-port="3" to-layer="1458" to-port="1" /> + <edge from-layer="1454" from-port="0" to-layer="1458" to-port="2" /> + <edge from-layer="1455" from-port="0" to-layer="1457" to-port="1" /> + <edge from-layer="1456" from-port="0" to-layer="1457" to-port="2" /> + <edge from-layer="1457" from-port="3" to-layer="1458" to-port="3" /> + <edge from-layer="1458" from-port="4" to-layer="1459" to-port="1" /> + <edge from-layer="1459" from-port="2" to-layer="1461" to-port="0" /> + <edge from-layer="1460" from-port="0" to-layer="1461" to-port="1" /> + <edge from-layer="1461" from-port="2" to-layer="1475" to-port="2" /> + <edge from-layer="1462" from-port="0" to-layer="1474" to-port="1" /> + <edge from-layer="1463" from-port="1" to-layer="1466" to-port="0" /> + <edge from-layer="1464" from-port="0" to-layer="1466" to-port="1" /> + <edge from-layer="1465" from-port="0" to-layer="1466" to-port="2" /> + <edge from-layer="1466" from-port="3" to-layer="1471" to-port="0" /> + <edge from-layer="1467" from-port="1" to-layer="1470" to-port="0" /> + <edge from-layer="1468" from-port="0" to-layer="1470" to-port="1" /> + <edge from-layer="1469" from-port="0" to-layer="1470" to-port="2" /> + <edge from-layer="1470" from-port="3" to-layer="1471" to-port="1" /> + <edge from-layer="1471" from-port="2" to-layer="1474" to-port="2" /> + <edge from-layer="1472" from-port="0" to-layer="1474" to-port="3" /> + <edge from-layer="1473" from-port="0" to-layer="1474" to-port="4" /> + <edge from-layer="1474" from-port="5" to-layer="1475" to-port="3" /> + <edge from-layer="1475" from-port="4" to-layer="1477" to-port="0" /> + <edge from-layer="1476" from-port="0" to-layer="1477" to-port="1" /> + <edge from-layer="1477" from-port="2" to-layer="1479" to-port="0" /> + <edge from-layer="1478" from-port="0" to-layer="1479" to-port="1" /> + <edge from-layer="1479" from-port="2" to-layer="1490" to-port="0" /> + <edge from-layer="1480" from-port="0" to-layer="1481" to-port="0" /> + <edge from-layer="1481" from-port="1" to-layer="1484" to-port="0" /> + <edge from-layer="1482" from-port="0" to-layer="1483" to-port="0" /> + <edge from-layer="1483" from-port="1" to-layer="1484" to-port="1" /> + <edge from-layer="1484" from-port="2" to-layer="1486" to-port="0" /> + <edge from-layer="1485" from-port="0" to-layer="1486" to-port="1" /> + <edge from-layer="1486" from-port="2" to-layer="1488" to-port="0" /> + <edge from-layer="1487" from-port="0" to-layer="1488" to-port="1" /> + <edge from-layer="1488" from-port="2" to-layer="1489" to-port="0" /> + <edge from-layer="1489" from-port="1" to-layer="1490" to-port="1" /> + <edge from-layer="1490" from-port="2" to-layer="1491" to-port="1" /> + <edge from-layer="1491" from-port="2" to-layer="1495" to-port="0" /> + <edge from-layer="1491" from-port="2" to-layer="1539" to-port="0" /> + <edge from-layer="1491" from-port="2" to-layer="1502" to-port="0" /> + <edge from-layer="1492" from-port="0" to-layer="1503" to-port="0" /> + <edge from-layer="1493" from-port="0" to-layer="1501" to-port="0" /> + <edge from-layer="1494" from-port="0" to-layer="1495" to-port="1" /> + <edge from-layer="1495" from-port="2" to-layer="1497" to-port="0" /> + <edge from-layer="1496" from-port="0" to-layer="1497" to-port="1" /> + <edge from-layer="1497" from-port="2" to-layer="1499" to-port="0" /> + <edge from-layer="1498" from-port="0" to-layer="1499" to-port="1" /> + <edge from-layer="1499" from-port="2" to-layer="1500" to-port="0" /> + <edge from-layer="1500" from-port="1" to-layer="1501" to-port="1" /> + <edge from-layer="1501" from-port="2" to-layer="1502" to-port="1" /> + <edge from-layer="1502" from-port="2" to-layer="1503" to-port="1" /> + <edge from-layer="1503" from-port="2" to-layer="1526" to-port="0" /> + <edge from-layer="1503" from-port="2" to-layer="1514" to-port="0" /> + <edge from-layer="1504" from-port="0" to-layer="1505" to-port="0" /> + <edge from-layer="1505" from-port="1" to-layer="1508" to-port="0" /> + <edge from-layer="1506" from-port="0" to-layer="1507" to-port="0" /> + <edge from-layer="1507" from-port="1" to-layer="1508" to-port="1" /> + <edge from-layer="1508" from-port="2" to-layer="1510" to-port="0" /> + <edge from-layer="1509" from-port="0" to-layer="1510" to-port="1" /> + <edge from-layer="1510" from-port="2" to-layer="1512" to-port="0" /> + <edge from-layer="1511" from-port="0" to-layer="1512" to-port="1" /> + <edge from-layer="1512" from-port="2" to-layer="1513" to-port="0" /> + <edge from-layer="1513" from-port="1" to-layer="1514" to-port="1" /> + <edge from-layer="1514" from-port="2" to-layer="1515" to-port="0" /> + <edge from-layer="1515" from-port="1" to-layer="1527" to-port="0" /> + <edge from-layer="1516" from-port="0" to-layer="1517" to-port="0" /> + <edge from-layer="1517" from-port="1" to-layer="1520" to-port="0" /> + <edge from-layer="1518" from-port="0" to-layer="1519" to-port="0" /> + <edge from-layer="1519" from-port="1" to-layer="1520" to-port="1" /> + <edge from-layer="1520" from-port="2" to-layer="1522" to-port="0" /> + <edge from-layer="1521" from-port="0" to-layer="1522" to-port="1" /> + <edge from-layer="1522" from-port="2" to-layer="1524" to-port="0" /> + <edge from-layer="1523" from-port="0" to-layer="1524" to-port="1" /> + <edge from-layer="1524" from-port="2" to-layer="1525" to-port="0" /> + <edge from-layer="1525" from-port="1" to-layer="1526" to-port="1" /> + <edge from-layer="1526" from-port="2" to-layer="1527" to-port="1" /> + <edge from-layer="1527" from-port="2" to-layer="1538" to-port="0" /> + <edge from-layer="1528" from-port="0" to-layer="1529" to-port="0" /> + <edge from-layer="1529" from-port="1" to-layer="1532" to-port="0" /> + <edge from-layer="1530" from-port="0" to-layer="1531" to-port="0" /> + <edge from-layer="1531" from-port="1" to-layer="1532" to-port="1" /> + <edge from-layer="1532" from-port="2" to-layer="1534" to-port="0" /> + <edge from-layer="1533" from-port="0" to-layer="1534" to-port="1" /> + <edge from-layer="1534" from-port="2" to-layer="1536" to-port="0" /> + <edge from-layer="1535" from-port="0" to-layer="1536" to-port="1" /> + <edge from-layer="1536" from-port="2" to-layer="1537" to-port="0" /> + <edge from-layer="1537" from-port="1" to-layer="1538" to-port="1" /> + <edge from-layer="1538" from-port="2" to-layer="1539" to-port="1" /> + <edge from-layer="1539" from-port="2" to-layer="1550" to-port="0" /> + <edge from-layer="1539" from-port="2" to-layer="1723" to-port="0" /> + <edge from-layer="1539" from-port="2" to-layer="1543" to-port="0" /> + <edge from-layer="1540" from-port="0" to-layer="1551" to-port="0" /> + <edge from-layer="1541" from-port="0" to-layer="1549" to-port="0" /> + <edge from-layer="1542" from-port="0" to-layer="1543" to-port="1" /> + <edge from-layer="1543" from-port="2" to-layer="1545" to-port="0" /> + <edge from-layer="1544" from-port="0" to-layer="1545" to-port="1" /> + <edge from-layer="1545" from-port="2" to-layer="1547" to-port="0" /> + <edge from-layer="1546" from-port="0" to-layer="1547" to-port="1" /> + <edge from-layer="1547" from-port="2" to-layer="1548" to-port="0" /> + <edge from-layer="1548" from-port="1" to-layer="1549" to-port="1" /> + <edge from-layer="1549" from-port="2" to-layer="1550" to-port="1" /> + <edge from-layer="1550" from-port="2" to-layer="1551" to-port="1" /> + <edge from-layer="1551" from-port="2" to-layer="1562" to-port="0" /> + <edge from-layer="1551" from-port="2" to-layer="1610" to-port="0" /> + <edge from-layer="1551" from-port="2" to-layer="1672" to-port="0" /> + <edge from-layer="1552" from-port="0" to-layer="1553" to-port="0" /> + <edge from-layer="1553" from-port="1" to-layer="1556" to-port="0" /> + <edge from-layer="1554" from-port="0" to-layer="1555" to-port="0" /> + <edge from-layer="1555" from-port="1" to-layer="1556" to-port="1" /> + <edge from-layer="1556" from-port="2" to-layer="1558" to-port="0" /> + <edge from-layer="1557" from-port="0" to-layer="1558" to-port="1" /> + <edge from-layer="1558" from-port="2" to-layer="1560" to-port="0" /> + <edge from-layer="1559" from-port="0" to-layer="1560" to-port="1" /> + <edge from-layer="1560" from-port="2" to-layer="1561" to-port="0" /> + <edge from-layer="1561" from-port="1" to-layer="1562" to-port="1" /> + <edge from-layer="1562" from-port="2" to-layer="1565" to-port="0" /> + <edge from-layer="1563" from-port="0" to-layer="1564" to-port="0" /> + <edge from-layer="1564" from-port="1" to-layer="1565" to-port="1" /> + <edge from-layer="1565" from-port="2" to-layer="1567" to-port="0" /> + <edge from-layer="1566" from-port="0" to-layer="1567" to-port="1" /> + <edge from-layer="1567" from-port="2" to-layer="1569" to-port="0" /> + <edge from-layer="1568" from-port="0" to-layer="1569" to-port="1" /> + <edge from-layer="1569" from-port="2" to-layer="1587" to-port="0" /> + <edge from-layer="1569" from-port="2" to-layer="1570" to-port="0" /> + <edge from-layer="1569" from-port="2" to-layer="1571" to-port="0" /> + <edge from-layer="1569" from-port="2" to-layer="1581" to-port="0" /> + <edge from-layer="1570" from-port="2" to-layer="1590" to-port="0" /> + <edge from-layer="1571" from-port="1" to-layer="1573" to-port="0" /> + <edge from-layer="1572" from-port="0" to-layer="1573" to-port="2" /> + <edge from-layer="1573" from-port="3" to-layer="1574" to-port="0" /> + <edge from-layer="1574" from-port="2" to-layer="1575" to-port="0" /> + <edge from-layer="1575" from-port="1" to-layer="1577" to-port="0" /> + <edge from-layer="1576" from-port="0" to-layer="1577" to-port="1" /> + <edge from-layer="1577" from-port="2" to-layer="1581" to-port="1" /> + <edge from-layer="1577" from-port="2" to-layer="1587" to-port="2" /> + <edge from-layer="1578" from-port="0" to-layer="1581" to-port="2" /> + <edge from-layer="1579" from-port="0" to-layer="1581" to-port="3" /> + <edge from-layer="1580" from-port="0" to-layer="1581" to-port="4" /> + <edge from-layer="1581" from-port="5" to-layer="1583" to-port="0" /> + <edge from-layer="1582" from-port="0" to-layer="1583" to-port="1" /> + <edge from-layer="1583" from-port="2" to-layer="1588" to-port="0" /> + <edge from-layer="1584" from-port="0" to-layer="1587" to-port="1" /> + <edge from-layer="1585" from-port="0" to-layer="1587" to-port="3" /> + <edge from-layer="1586" from-port="0" to-layer="1587" to-port="4" /> + <edge from-layer="1587" from-port="5" to-layer="1588" to-port="1" /> + <edge from-layer="1588" from-port="2" to-layer="1589" to-port="0" /> + <edge from-layer="1589" from-port="2" to-layer="1590" to-port="1" /> + <edge from-layer="1590" from-port="2" to-layer="1707" to-port="0" /> + <edge from-layer="1591" from-port="0" to-layer="1596" to-port="0" /> + <edge from-layer="1592" from-port="0" to-layer="1595" to-port="1" /> + <edge from-layer="1593" from-port="0" to-layer="1595" to-port="2" /> + <edge from-layer="1594" from-port="0" to-layer="1595" to-port="3" /> + <edge from-layer="1595" from-port="4" to-layer="1596" to-port="1" /> + <edge from-layer="1596" from-port="2" to-layer="1597" to-port="0" /> + <edge from-layer="1597" from-port="1" to-layer="1599" to-port="0" /> + <edge from-layer="1598" from-port="0" to-layer="1599" to-port="2" /> + <edge from-layer="1599" from-port="3" to-layer="1695" to-port="0" /> + <edge from-layer="1599" from-port="3" to-layer="1639" to-port="0" /> + <edge from-layer="1600" from-port="0" to-layer="1601" to-port="0" /> + <edge from-layer="1601" from-port="1" to-layer="1604" to-port="0" /> + <edge from-layer="1602" from-port="0" to-layer="1603" to-port="0" /> + <edge from-layer="1603" from-port="1" to-layer="1604" to-port="1" /> + <edge from-layer="1604" from-port="2" to-layer="1606" to-port="0" /> + <edge from-layer="1605" from-port="0" to-layer="1606" to-port="1" /> + <edge from-layer="1606" from-port="2" to-layer="1608" to-port="0" /> + <edge from-layer="1607" from-port="0" to-layer="1608" to-port="1" /> + <edge from-layer="1608" from-port="2" to-layer="1609" to-port="0" /> + <edge from-layer="1609" from-port="1" to-layer="1610" to-port="1" /> + <edge from-layer="1610" from-port="2" to-layer="1613" to-port="0" /> + <edge from-layer="1611" from-port="0" to-layer="1612" to-port="0" /> + <edge from-layer="1612" from-port="1" to-layer="1613" to-port="1" /> + <edge from-layer="1613" from-port="2" to-layer="1615" to-port="0" /> + <edge from-layer="1614" from-port="0" to-layer="1615" to-port="1" /> + <edge from-layer="1615" from-port="2" to-layer="1617" to-port="0" /> + <edge from-layer="1616" from-port="0" to-layer="1617" to-port="1" /> + <edge from-layer="1617" from-port="2" to-layer="1629" to-port="0" /> + <edge from-layer="1617" from-port="2" to-layer="1618" to-port="0" /> + <edge from-layer="1617" from-port="2" to-layer="1619" to-port="0" /> + <edge from-layer="1617" from-port="2" to-layer="1635" to-port="0" /> + <edge from-layer="1618" from-port="2" to-layer="1638" to-port="0" /> + <edge from-layer="1619" from-port="1" to-layer="1621" to-port="0" /> + <edge from-layer="1620" from-port="0" to-layer="1621" to-port="2" /> + <edge from-layer="1621" from-port="3" to-layer="1622" to-port="0" /> + <edge from-layer="1622" from-port="2" to-layer="1623" to-port="0" /> + <edge from-layer="1623" from-port="1" to-layer="1625" to-port="0" /> + <edge from-layer="1624" from-port="0" to-layer="1625" to-port="1" /> + <edge from-layer="1625" from-port="2" to-layer="1635" to-port="2" /> + <edge from-layer="1625" from-port="2" to-layer="1629" to-port="1" /> + <edge from-layer="1626" from-port="0" to-layer="1629" to-port="2" /> + <edge from-layer="1627" from-port="0" to-layer="1629" to-port="3" /> + <edge from-layer="1628" from-port="0" to-layer="1629" to-port="4" /> + <edge from-layer="1629" from-port="5" to-layer="1631" to-port="0" /> + <edge from-layer="1630" from-port="0" to-layer="1631" to-port="1" /> + <edge from-layer="1631" from-port="2" to-layer="1636" to-port="0" /> + <edge from-layer="1632" from-port="0" to-layer="1635" to-port="1" /> + <edge from-layer="1633" from-port="0" to-layer="1635" to-port="3" /> + <edge from-layer="1634" from-port="0" to-layer="1635" to-port="4" /> + <edge from-layer="1635" from-port="5" to-layer="1636" to-port="1" /> + <edge from-layer="1636" from-port="2" to-layer="1637" to-port="0" /> + <edge from-layer="1637" from-port="2" to-layer="1638" to-port="1" /> + <edge from-layer="1638" from-port="2" to-layer="1699" to-port="0" /> + <edge from-layer="1638" from-port="2" to-layer="1639" to-port="1" /> + <edge from-layer="1639" from-port="2" to-layer="1641" to-port="0" /> + <edge from-layer="1639" from-port="2" to-layer="1640" to-port="0" /> + <edge from-layer="1639" from-port="2" to-layer="2322" to-port="0" /> + <edge from-layer="1640" from-port="2" to-layer="1650" to-port="0" /> + <edge from-layer="1641" from-port="1" to-layer="1644" to-port="0" /> + <edge from-layer="1641" from-port="1" to-layer="1648" to-port="0" /> + <edge from-layer="1642" from-port="0" to-layer="1644" to-port="1" /> + <edge from-layer="1643" from-port="0" to-layer="1644" to-port="2" /> + <edge from-layer="1644" from-port="3" to-layer="1649" to-port="0" /> + <edge from-layer="1645" from-port="0" to-layer="1649" to-port="1" /> + <edge from-layer="1646" from-port="0" to-layer="1648" to-port="1" /> + <edge from-layer="1647" from-port="0" to-layer="1648" to-port="2" /> + <edge from-layer="1648" from-port="3" to-layer="1649" to-port="2" /> + <edge from-layer="1649" from-port="3" to-layer="1650" to-port="1" /> + <edge from-layer="1650" from-port="2" to-layer="1652" to-port="0" /> + <edge from-layer="1651" from-port="0" to-layer="1652" to-port="1" /> + <edge from-layer="1652" from-port="2" to-layer="1707" to-port="1" /> + <edge from-layer="1653" from-port="0" to-layer="1658" to-port="0" /> + <edge from-layer="1654" from-port="0" to-layer="1657" to-port="1" /> + <edge from-layer="1655" from-port="0" to-layer="1657" to-port="2" /> + <edge from-layer="1656" from-port="0" to-layer="1657" to-port="3" /> + <edge from-layer="1657" from-port="4" to-layer="1658" to-port="1" /> + <edge from-layer="1658" from-port="2" to-layer="1659" to-port="0" /> + <edge from-layer="1659" from-port="1" to-layer="1661" to-port="0" /> + <edge from-layer="1660" from-port="0" to-layer="1661" to-port="2" /> + <edge from-layer="1661" from-port="3" to-layer="1680" to-port="0" /> + <edge from-layer="1662" from-port="0" to-layer="1663" to-port="0" /> + <edge from-layer="1663" from-port="1" to-layer="1666" to-port="0" /> + <edge from-layer="1664" from-port="0" to-layer="1665" to-port="0" /> + <edge from-layer="1665" from-port="1" to-layer="1666" to-port="1" /> + <edge from-layer="1666" from-port="2" to-layer="1668" to-port="0" /> + <edge from-layer="1667" from-port="0" to-layer="1668" to-port="1" /> + <edge from-layer="1668" from-port="2" to-layer="1670" to-port="0" /> + <edge from-layer="1669" from-port="0" to-layer="1670" to-port="1" /> + <edge from-layer="1670" from-port="2" to-layer="1671" to-port="0" /> + <edge from-layer="1671" from-port="1" to-layer="1672" to-port="1" /> + <edge from-layer="1672" from-port="2" to-layer="1675" to-port="0" /> + <edge from-layer="1673" from-port="0" to-layer="1674" to-port="0" /> + <edge from-layer="1674" from-port="1" to-layer="1675" to-port="1" /> + <edge from-layer="1675" from-port="2" to-layer="1677" to-port="0" /> + <edge from-layer="1676" from-port="0" to-layer="1677" to-port="1" /> + <edge from-layer="1677" from-port="2" to-layer="1679" to-port="0" /> + <edge from-layer="1678" from-port="0" to-layer="1679" to-port="1" /> + <edge from-layer="1679" from-port="2" to-layer="1680" to-port="1" /> + <edge from-layer="1680" from-port="2" to-layer="1681" to-port="0" /> + <edge from-layer="1680" from-port="2" to-layer="1682" to-port="0" /> + <edge from-layer="1680" from-port="2" to-layer="2321" to-port="0" /> + <edge from-layer="1681" from-port="2" to-layer="1691" to-port="0" /> + <edge from-layer="1682" from-port="1" to-layer="1685" to-port="0" /> + <edge from-layer="1682" from-port="1" to-layer="1689" to-port="0" /> + <edge from-layer="1683" from-port="0" to-layer="1685" to-port="1" /> + <edge from-layer="1684" from-port="0" to-layer="1685" to-port="2" /> + <edge from-layer="1685" from-port="3" to-layer="1690" to-port="1" /> + <edge from-layer="1686" from-port="0" to-layer="1690" to-port="2" /> + <edge from-layer="1687" from-port="0" to-layer="1689" to-port="1" /> + <edge from-layer="1688" from-port="0" to-layer="1689" to-port="2" /> + <edge from-layer="1689" from-port="3" to-layer="1690" to-port="3" /> + <edge from-layer="1690" from-port="4" to-layer="1691" to-port="1" /> + <edge from-layer="1691" from-port="2" to-layer="1693" to-port="0" /> + <edge from-layer="1692" from-port="0" to-layer="1693" to-port="1" /> + <edge from-layer="1693" from-port="2" to-layer="1707" to-port="2" /> + <edge from-layer="1694" from-port="0" to-layer="1706" to-port="1" /> + <edge from-layer="1695" from-port="1" to-layer="1698" to-port="0" /> + <edge from-layer="1696" from-port="0" to-layer="1698" to-port="1" /> + <edge from-layer="1697" from-port="0" to-layer="1698" to-port="2" /> + <edge from-layer="1698" from-port="3" to-layer="1703" to-port="0" /> + <edge from-layer="1699" from-port="1" to-layer="1702" to-port="0" /> + <edge from-layer="1700" from-port="0" to-layer="1702" to-port="1" /> + <edge from-layer="1701" from-port="0" to-layer="1702" to-port="2" /> + <edge from-layer="1702" from-port="3" to-layer="1703" to-port="1" /> + <edge from-layer="1703" from-port="2" to-layer="1706" to-port="2" /> + <edge from-layer="1704" from-port="0" to-layer="1706" to-port="3" /> + <edge from-layer="1705" from-port="0" to-layer="1706" to-port="4" /> + <edge from-layer="1706" from-port="5" to-layer="1707" to-port="3" /> + <edge from-layer="1707" from-port="4" to-layer="1709" to-port="0" /> + <edge from-layer="1708" from-port="0" to-layer="1709" to-port="1" /> + <edge from-layer="1709" from-port="2" to-layer="1711" to-port="0" /> + <edge from-layer="1710" from-port="0" to-layer="1711" to-port="1" /> + <edge from-layer="1711" from-port="2" to-layer="1722" to-port="0" /> + <edge from-layer="1712" from-port="0" to-layer="1713" to-port="0" /> + <edge from-layer="1713" from-port="1" to-layer="1716" to-port="0" /> + <edge from-layer="1714" from-port="0" to-layer="1715" to-port="0" /> + <edge from-layer="1715" from-port="1" to-layer="1716" to-port="1" /> + <edge from-layer="1716" from-port="2" to-layer="1718" to-port="0" /> + <edge from-layer="1717" from-port="0" to-layer="1718" to-port="1" /> + <edge from-layer="1718" from-port="2" to-layer="1720" to-port="0" /> + <edge from-layer="1719" from-port="0" to-layer="1720" to-port="1" /> + <edge from-layer="1720" from-port="2" to-layer="1721" to-port="0" /> + <edge from-layer="1721" from-port="1" to-layer="1722" to-port="1" /> + <edge from-layer="1722" from-port="2" to-layer="1723" to-port="1" /> + <edge from-layer="1723" from-port="2" to-layer="1771" to-port="0" /> + <edge from-layer="1723" from-port="2" to-layer="1734" to-port="0" /> + <edge from-layer="1723" from-port="2" to-layer="1727" to-port="0" /> + <edge from-layer="1724" from-port="0" to-layer="1735" to-port="0" /> + <edge from-layer="1725" from-port="0" to-layer="1733" to-port="0" /> + <edge from-layer="1726" from-port="0" to-layer="1727" to-port="1" /> + <edge from-layer="1727" from-port="2" to-layer="1729" to-port="0" /> + <edge from-layer="1728" from-port="0" to-layer="1729" to-port="1" /> + <edge from-layer="1729" from-port="2" to-layer="1731" to-port="0" /> + <edge from-layer="1730" from-port="0" to-layer="1731" to-port="1" /> + <edge from-layer="1731" from-port="2" to-layer="1732" to-port="0" /> + <edge from-layer="1732" from-port="1" to-layer="1733" to-port="1" /> + <edge from-layer="1733" from-port="2" to-layer="1734" to-port="1" /> + <edge from-layer="1734" from-port="2" to-layer="1735" to-port="1" /> + <edge from-layer="1735" from-port="2" to-layer="1746" to-port="0" /> + <edge from-layer="1735" from-port="2" to-layer="1758" to-port="0" /> + <edge from-layer="1736" from-port="0" to-layer="1737" to-port="0" /> + <edge from-layer="1737" from-port="1" to-layer="1740" to-port="0" /> + <edge from-layer="1738" from-port="0" to-layer="1739" to-port="0" /> + <edge from-layer="1739" from-port="1" to-layer="1740" to-port="1" /> + <edge from-layer="1740" from-port="2" to-layer="1742" to-port="0" /> + <edge from-layer="1741" from-port="0" to-layer="1742" to-port="1" /> + <edge from-layer="1742" from-port="2" to-layer="1744" to-port="0" /> + <edge from-layer="1743" from-port="0" to-layer="1744" to-port="1" /> + <edge from-layer="1744" from-port="2" to-layer="1745" to-port="0" /> + <edge from-layer="1745" from-port="1" to-layer="1746" to-port="1" /> + <edge from-layer="1746" from-port="2" to-layer="1747" to-port="0" /> + <edge from-layer="1747" from-port="1" to-layer="1759" to-port="0" /> + <edge from-layer="1748" from-port="0" to-layer="1749" to-port="0" /> + <edge from-layer="1749" from-port="1" to-layer="1752" to-port="0" /> + <edge from-layer="1750" from-port="0" to-layer="1751" to-port="0" /> + <edge from-layer="1751" from-port="1" to-layer="1752" to-port="1" /> + <edge from-layer="1752" from-port="2" to-layer="1754" to-port="0" /> + <edge from-layer="1753" from-port="0" to-layer="1754" to-port="1" /> + <edge from-layer="1754" from-port="2" to-layer="1756" to-port="0" /> + <edge from-layer="1755" from-port="0" to-layer="1756" to-port="1" /> + <edge from-layer="1756" from-port="2" to-layer="1757" to-port="0" /> + <edge from-layer="1757" from-port="1" to-layer="1758" to-port="1" /> + <edge from-layer="1758" from-port="2" to-layer="1759" to-port="1" /> + <edge from-layer="1759" from-port="2" to-layer="1770" to-port="0" /> + <edge from-layer="1760" from-port="0" to-layer="1761" to-port="0" /> + <edge from-layer="1761" from-port="1" to-layer="1764" to-port="0" /> + <edge from-layer="1762" from-port="0" to-layer="1763" to-port="0" /> + <edge from-layer="1763" from-port="1" to-layer="1764" to-port="1" /> + <edge from-layer="1764" from-port="2" to-layer="1766" to-port="0" /> + <edge from-layer="1765" from-port="0" to-layer="1766" to-port="1" /> + <edge from-layer="1766" from-port="2" to-layer="1768" to-port="0" /> + <edge from-layer="1767" from-port="0" to-layer="1768" to-port="1" /> + <edge from-layer="1768" from-port="2" to-layer="1769" to-port="0" /> + <edge from-layer="1769" from-port="1" to-layer="1770" to-port="1" /> + <edge from-layer="1770" from-port="2" to-layer="1771" to-port="1" /> + <edge from-layer="1771" from-port="2" to-layer="1775" to-port="0" /> + <edge from-layer="1771" from-port="2" to-layer="1955" to-port="0" /> + <edge from-layer="1771" from-port="2" to-layer="1782" to-port="0" /> + <edge from-layer="1772" from-port="0" to-layer="1783" to-port="0" /> + <edge from-layer="1773" from-port="0" to-layer="1781" to-port="0" /> + <edge from-layer="1774" from-port="0" to-layer="1775" to-port="1" /> + <edge from-layer="1775" from-port="2" to-layer="1777" to-port="0" /> + <edge from-layer="1776" from-port="0" to-layer="1777" to-port="1" /> + <edge from-layer="1777" from-port="2" to-layer="1779" to-port="0" /> + <edge from-layer="1778" from-port="0" to-layer="1779" to-port="1" /> + <edge from-layer="1779" from-port="2" to-layer="1780" to-port="0" /> + <edge from-layer="1780" from-port="1" to-layer="1781" to-port="1" /> + <edge from-layer="1781" from-port="2" to-layer="1782" to-port="1" /> + <edge from-layer="1782" from-port="2" to-layer="1783" to-port="1" /> + <edge from-layer="1783" from-port="2" to-layer="1794" to-port="0" /> + <edge from-layer="1783" from-port="2" to-layer="1904" to-port="0" /> + <edge from-layer="1783" from-port="2" to-layer="1842" to-port="0" /> + <edge from-layer="1784" from-port="0" to-layer="1785" to-port="0" /> + <edge from-layer="1785" from-port="1" to-layer="1788" to-port="0" /> + <edge from-layer="1786" from-port="0" to-layer="1787" to-port="0" /> + <edge from-layer="1787" from-port="1" to-layer="1788" to-port="1" /> + <edge from-layer="1788" from-port="2" to-layer="1790" to-port="0" /> + <edge from-layer="1789" from-port="0" to-layer="1790" to-port="1" /> + <edge from-layer="1790" from-port="2" to-layer="1792" to-port="0" /> + <edge from-layer="1791" from-port="0" to-layer="1792" to-port="1" /> + <edge from-layer="1792" from-port="2" to-layer="1793" to-port="0" /> + <edge from-layer="1793" from-port="1" to-layer="1794" to-port="1" /> + <edge from-layer="1794" from-port="2" to-layer="1797" to-port="0" /> + <edge from-layer="1795" from-port="0" to-layer="1796" to-port="0" /> + <edge from-layer="1796" from-port="1" to-layer="1797" to-port="1" /> + <edge from-layer="1797" from-port="2" to-layer="1799" to-port="0" /> + <edge from-layer="1798" from-port="0" to-layer="1799" to-port="1" /> + <edge from-layer="1799" from-port="2" to-layer="1801" to-port="0" /> + <edge from-layer="1800" from-port="0" to-layer="1801" to-port="1" /> + <edge from-layer="1801" from-port="2" to-layer="1802" to-port="0" /> + <edge from-layer="1801" from-port="2" to-layer="1803" to-port="0" /> + <edge from-layer="1801" from-port="2" to-layer="1813" to-port="0" /> + <edge from-layer="1801" from-port="2" to-layer="1819" to-port="0" /> + <edge from-layer="1802" from-port="2" to-layer="1822" to-port="0" /> + <edge from-layer="1803" from-port="1" to-layer="1805" to-port="0" /> + <edge from-layer="1804" from-port="0" to-layer="1805" to-port="2" /> + <edge from-layer="1805" from-port="3" to-layer="1806" to-port="0" /> + <edge from-layer="1806" from-port="2" to-layer="1807" to-port="0" /> + <edge from-layer="1807" from-port="1" to-layer="1809" to-port="0" /> + <edge from-layer="1808" from-port="0" to-layer="1809" to-port="1" /> + <edge from-layer="1809" from-port="2" to-layer="1813" to-port="1" /> + <edge from-layer="1809" from-port="2" to-layer="1819" to-port="2" /> + <edge from-layer="1810" from-port="0" to-layer="1813" to-port="2" /> + <edge from-layer="1811" from-port="0" to-layer="1813" to-port="3" /> + <edge from-layer="1812" from-port="0" to-layer="1813" to-port="4" /> + <edge from-layer="1813" from-port="5" to-layer="1815" to-port="0" /> + <edge from-layer="1814" from-port="0" to-layer="1815" to-port="1" /> + <edge from-layer="1815" from-port="2" to-layer="1820" to-port="0" /> + <edge from-layer="1816" from-port="0" to-layer="1819" to-port="1" /> + <edge from-layer="1817" from-port="0" to-layer="1819" to-port="3" /> + <edge from-layer="1818" from-port="0" to-layer="1819" to-port="4" /> + <edge from-layer="1819" from-port="5" to-layer="1820" to-port="1" /> + <edge from-layer="1820" from-port="2" to-layer="1821" to-port="0" /> + <edge from-layer="1821" from-port="2" to-layer="1822" to-port="1" /> + <edge from-layer="1822" from-port="2" to-layer="1939" to-port="0" /> + <edge from-layer="1823" from-port="0" to-layer="1828" to-port="0" /> + <edge from-layer="1824" from-port="0" to-layer="1827" to-port="1" /> + <edge from-layer="1825" from-port="0" to-layer="1827" to-port="2" /> + <edge from-layer="1826" from-port="0" to-layer="1827" to-port="3" /> + <edge from-layer="1827" from-port="4" to-layer="1828" to-port="1" /> + <edge from-layer="1828" from-port="2" to-layer="1829" to-port="0" /> + <edge from-layer="1829" from-port="1" to-layer="1831" to-port="0" /> + <edge from-layer="1830" from-port="0" to-layer="1831" to-port="2" /> + <edge from-layer="1831" from-port="3" to-layer="1927" to-port="0" /> + <edge from-layer="1831" from-port="3" to-layer="1871" to-port="0" /> + <edge from-layer="1832" from-port="0" to-layer="1833" to-port="0" /> + <edge from-layer="1833" from-port="1" to-layer="1836" to-port="0" /> + <edge from-layer="1834" from-port="0" to-layer="1835" to-port="0" /> + <edge from-layer="1835" from-port="1" to-layer="1836" to-port="1" /> + <edge from-layer="1836" from-port="2" to-layer="1838" to-port="0" /> + <edge from-layer="1837" from-port="0" to-layer="1838" to-port="1" /> + <edge from-layer="1838" from-port="2" to-layer="1840" to-port="0" /> + <edge from-layer="1839" from-port="0" to-layer="1840" to-port="1" /> + <edge from-layer="1840" from-port="2" to-layer="1841" to-port="0" /> + <edge from-layer="1841" from-port="1" to-layer="1842" to-port="1" /> + <edge from-layer="1842" from-port="2" to-layer="1845" to-port="0" /> + <edge from-layer="1843" from-port="0" to-layer="1844" to-port="0" /> + <edge from-layer="1844" from-port="1" to-layer="1845" to-port="1" /> + <edge from-layer="1845" from-port="2" to-layer="1847" to-port="0" /> + <edge from-layer="1846" from-port="0" to-layer="1847" to-port="1" /> + <edge from-layer="1847" from-port="2" to-layer="1849" to-port="0" /> + <edge from-layer="1848" from-port="0" to-layer="1849" to-port="1" /> + <edge from-layer="1849" from-port="2" to-layer="1867" to-port="0" /> + <edge from-layer="1849" from-port="2" to-layer="1850" to-port="0" /> + <edge from-layer="1849" from-port="2" to-layer="1861" to-port="0" /> + <edge from-layer="1849" from-port="2" to-layer="1851" to-port="0" /> + <edge from-layer="1850" from-port="2" to-layer="1870" to-port="0" /> + <edge from-layer="1851" from-port="1" to-layer="1853" to-port="0" /> + <edge from-layer="1852" from-port="0" to-layer="1853" to-port="2" /> + <edge from-layer="1853" from-port="3" to-layer="1854" to-port="0" /> + <edge from-layer="1854" from-port="2" to-layer="1855" to-port="0" /> + <edge from-layer="1855" from-port="1" to-layer="1857" to-port="0" /> + <edge from-layer="1856" from-port="0" to-layer="1857" to-port="1" /> + <edge from-layer="1857" from-port="2" to-layer="1867" to-port="2" /> + <edge from-layer="1857" from-port="2" to-layer="1861" to-port="1" /> + <edge from-layer="1858" from-port="0" to-layer="1861" to-port="2" /> + <edge from-layer="1859" from-port="0" to-layer="1861" to-port="3" /> + <edge from-layer="1860" from-port="0" to-layer="1861" to-port="4" /> + <edge from-layer="1861" from-port="5" to-layer="1863" to-port="0" /> + <edge from-layer="1862" from-port="0" to-layer="1863" to-port="1" /> + <edge from-layer="1863" from-port="2" to-layer="1868" to-port="0" /> + <edge from-layer="1864" from-port="0" to-layer="1867" to-port="1" /> + <edge from-layer="1865" from-port="0" to-layer="1867" to-port="3" /> + <edge from-layer="1866" from-port="0" to-layer="1867" to-port="4" /> + <edge from-layer="1867" from-port="5" to-layer="1868" to-port="1" /> + <edge from-layer="1868" from-port="2" to-layer="1869" to-port="0" /> + <edge from-layer="1869" from-port="2" to-layer="1870" to-port="1" /> + <edge from-layer="1870" from-port="2" to-layer="1871" to-port="1" /> + <edge from-layer="1870" from-port="2" to-layer="1931" to-port="0" /> + <edge from-layer="1871" from-port="2" to-layer="2320" to-port="0" /> + <edge from-layer="1871" from-port="2" to-layer="1872" to-port="0" /> + <edge from-layer="1871" from-port="2" to-layer="1873" to-port="0" /> + <edge from-layer="1872" from-port="2" to-layer="1882" to-port="0" /> + <edge from-layer="1873" from-port="1" to-layer="1876" to-port="0" /> + <edge from-layer="1873" from-port="1" to-layer="1880" to-port="0" /> + <edge from-layer="1874" from-port="0" to-layer="1876" to-port="1" /> + <edge from-layer="1875" from-port="0" to-layer="1876" to-port="2" /> + <edge from-layer="1876" from-port="3" to-layer="1881" to-port="0" /> + <edge from-layer="1877" from-port="0" to-layer="1881" to-port="1" /> + <edge from-layer="1878" from-port="0" to-layer="1880" to-port="1" /> + <edge from-layer="1879" from-port="0" to-layer="1880" to-port="2" /> + <edge from-layer="1880" from-port="3" to-layer="1881" to-port="2" /> + <edge from-layer="1881" from-port="3" to-layer="1882" to-port="1" /> + <edge from-layer="1882" from-port="2" to-layer="1884" to-port="0" /> + <edge from-layer="1883" from-port="0" to-layer="1884" to-port="1" /> + <edge from-layer="1884" from-port="2" to-layer="1939" to-port="1" /> + <edge from-layer="1885" from-port="0" to-layer="1890" to-port="0" /> + <edge from-layer="1886" from-port="0" to-layer="1889" to-port="1" /> + <edge from-layer="1887" from-port="0" to-layer="1889" to-port="2" /> + <edge from-layer="1888" from-port="0" to-layer="1889" to-port="3" /> + <edge from-layer="1889" from-port="4" to-layer="1890" to-port="1" /> + <edge from-layer="1890" from-port="2" to-layer="1891" to-port="0" /> + <edge from-layer="1891" from-port="1" to-layer="1893" to-port="0" /> + <edge from-layer="1892" from-port="0" to-layer="1893" to-port="2" /> + <edge from-layer="1893" from-port="3" to-layer="1912" to-port="0" /> + <edge from-layer="1894" from-port="0" to-layer="1895" to-port="0" /> + <edge from-layer="1895" from-port="1" to-layer="1898" to-port="0" /> + <edge from-layer="1896" from-port="0" to-layer="1897" to-port="0" /> + <edge from-layer="1897" from-port="1" to-layer="1898" to-port="1" /> + <edge from-layer="1898" from-port="2" to-layer="1900" to-port="0" /> + <edge from-layer="1899" from-port="0" to-layer="1900" to-port="1" /> + <edge from-layer="1900" from-port="2" to-layer="1902" to-port="0" /> + <edge from-layer="1901" from-port="0" to-layer="1902" to-port="1" /> + <edge from-layer="1902" from-port="2" to-layer="1903" to-port="0" /> + <edge from-layer="1903" from-port="1" to-layer="1904" to-port="1" /> + <edge from-layer="1904" from-port="2" to-layer="1907" to-port="0" /> + <edge from-layer="1905" from-port="0" to-layer="1906" to-port="0" /> + <edge from-layer="1906" from-port="1" to-layer="1907" to-port="1" /> + <edge from-layer="1907" from-port="2" to-layer="1909" to-port="0" /> + <edge from-layer="1908" from-port="0" to-layer="1909" to-port="1" /> + <edge from-layer="1909" from-port="2" to-layer="1911" to-port="0" /> + <edge from-layer="1910" from-port="0" to-layer="1911" to-port="1" /> + <edge from-layer="1911" from-port="2" to-layer="1912" to-port="1" /> + <edge from-layer="1912" from-port="2" to-layer="2319" to-port="0" /> + <edge from-layer="1912" from-port="2" to-layer="1913" to-port="0" /> + <edge from-layer="1912" from-port="2" to-layer="1914" to-port="0" /> + <edge from-layer="1913" from-port="2" to-layer="1923" to-port="0" /> + <edge from-layer="1914" from-port="1" to-layer="1917" to-port="0" /> + <edge from-layer="1914" from-port="1" to-layer="1921" to-port="0" /> + <edge from-layer="1915" from-port="0" to-layer="1917" to-port="1" /> + <edge from-layer="1916" from-port="0" to-layer="1917" to-port="2" /> + <edge from-layer="1917" from-port="3" to-layer="1922" to-port="1" /> + <edge from-layer="1918" from-port="0" to-layer="1922" to-port="2" /> + <edge from-layer="1919" from-port="0" to-layer="1921" to-port="1" /> + <edge from-layer="1920" from-port="0" to-layer="1921" to-port="2" /> + <edge from-layer="1921" from-port="3" to-layer="1922" to-port="3" /> + <edge from-layer="1922" from-port="4" to-layer="1923" to-port="1" /> + <edge from-layer="1923" from-port="2" to-layer="1925" to-port="0" /> + <edge from-layer="1924" from-port="0" to-layer="1925" to-port="1" /> + <edge from-layer="1925" from-port="2" to-layer="1939" to-port="2" /> + <edge from-layer="1926" from-port="0" to-layer="1938" to-port="1" /> + <edge from-layer="1927" from-port="1" to-layer="1930" to-port="0" /> + <edge from-layer="1928" from-port="0" to-layer="1930" to-port="1" /> + <edge from-layer="1929" from-port="0" to-layer="1930" to-port="2" /> + <edge from-layer="1930" from-port="3" to-layer="1935" to-port="0" /> + <edge from-layer="1931" from-port="1" to-layer="1934" to-port="0" /> + <edge from-layer="1932" from-port="0" to-layer="1934" to-port="1" /> + <edge from-layer="1933" from-port="0" to-layer="1934" to-port="2" /> + <edge from-layer="1934" from-port="3" to-layer="1935" to-port="1" /> + <edge from-layer="1935" from-port="2" to-layer="1938" to-port="2" /> + <edge from-layer="1936" from-port="0" to-layer="1938" to-port="3" /> + <edge from-layer="1937" from-port="0" to-layer="1938" to-port="4" /> + <edge from-layer="1938" from-port="5" to-layer="1939" to-port="3" /> + <edge from-layer="1939" from-port="4" to-layer="1941" to-port="0" /> + <edge from-layer="1940" from-port="0" to-layer="1941" to-port="1" /> + <edge from-layer="1941" from-port="2" to-layer="1943" to-port="0" /> + <edge from-layer="1942" from-port="0" to-layer="1943" to-port="1" /> + <edge from-layer="1943" from-port="2" to-layer="1954" to-port="0" /> + <edge from-layer="1944" from-port="0" to-layer="1945" to-port="0" /> + <edge from-layer="1945" from-port="1" to-layer="1948" to-port="0" /> + <edge from-layer="1946" from-port="0" to-layer="1947" to-port="0" /> + <edge from-layer="1947" from-port="1" to-layer="1948" to-port="1" /> + <edge from-layer="1948" from-port="2" to-layer="1950" to-port="0" /> + <edge from-layer="1949" from-port="0" to-layer="1950" to-port="1" /> + <edge from-layer="1950" from-port="2" to-layer="1952" to-port="0" /> + <edge from-layer="1951" from-port="0" to-layer="1952" to-port="1" /> + <edge from-layer="1952" from-port="2" to-layer="1953" to-port="0" /> + <edge from-layer="1953" from-port="1" to-layer="1954" to-port="1" /> + <edge from-layer="1954" from-port="2" to-layer="1955" to-port="1" /> + <edge from-layer="1955" from-port="2" to-layer="1959" to-port="0" /> + <edge from-layer="1955" from-port="2" to-layer="2003" to-port="0" /> + <edge from-layer="1955" from-port="2" to-layer="1966" to-port="0" /> + <edge from-layer="1956" from-port="0" to-layer="1967" to-port="0" /> + <edge from-layer="1957" from-port="0" to-layer="1965" to-port="0" /> + <edge from-layer="1958" from-port="0" to-layer="1959" to-port="1" /> + <edge from-layer="1959" from-port="2" to-layer="1961" to-port="0" /> + <edge from-layer="1960" from-port="0" to-layer="1961" to-port="1" /> + <edge from-layer="1961" from-port="2" to-layer="1963" to-port="0" /> + <edge from-layer="1962" from-port="0" to-layer="1963" to-port="1" /> + <edge from-layer="1963" from-port="2" to-layer="1964" to-port="0" /> + <edge from-layer="1964" from-port="1" to-layer="1965" to-port="1" /> + <edge from-layer="1965" from-port="2" to-layer="1966" to-port="1" /> + <edge from-layer="1966" from-port="2" to-layer="1967" to-port="1" /> + <edge from-layer="1967" from-port="2" to-layer="1990" to-port="0" /> + <edge from-layer="1967" from-port="2" to-layer="1978" to-port="0" /> + <edge from-layer="1968" from-port="0" to-layer="1969" to-port="0" /> + <edge from-layer="1969" from-port="1" to-layer="1972" to-port="0" /> + <edge from-layer="1970" from-port="0" to-layer="1971" to-port="0" /> + <edge from-layer="1971" from-port="1" to-layer="1972" to-port="1" /> + <edge from-layer="1972" from-port="2" to-layer="1974" to-port="0" /> + <edge from-layer="1973" from-port="0" to-layer="1974" to-port="1" /> + <edge from-layer="1974" from-port="2" to-layer="1976" to-port="0" /> + <edge from-layer="1975" from-port="0" to-layer="1976" to-port="1" /> + <edge from-layer="1976" from-port="2" to-layer="1977" to-port="0" /> + <edge from-layer="1977" from-port="1" to-layer="1978" to-port="1" /> + <edge from-layer="1978" from-port="2" to-layer="1979" to-port="0" /> + <edge from-layer="1979" from-port="1" to-layer="1991" to-port="0" /> + <edge from-layer="1980" from-port="0" to-layer="1981" to-port="0" /> + <edge from-layer="1981" from-port="1" to-layer="1984" to-port="0" /> + <edge from-layer="1982" from-port="0" to-layer="1983" to-port="0" /> + <edge from-layer="1983" from-port="1" to-layer="1984" to-port="1" /> + <edge from-layer="1984" from-port="2" to-layer="1986" to-port="0" /> + <edge from-layer="1985" from-port="0" to-layer="1986" to-port="1" /> + <edge from-layer="1986" from-port="2" to-layer="1988" to-port="0" /> + <edge from-layer="1987" from-port="0" to-layer="1988" to-port="1" /> + <edge from-layer="1988" from-port="2" to-layer="1989" to-port="0" /> + <edge from-layer="1989" from-port="1" to-layer="1990" to-port="1" /> + <edge from-layer="1990" from-port="2" to-layer="1991" to-port="1" /> + <edge from-layer="1991" from-port="2" to-layer="2002" to-port="0" /> + <edge from-layer="1992" from-port="0" to-layer="1993" to-port="0" /> + <edge from-layer="1993" from-port="1" to-layer="1996" to-port="0" /> + <edge from-layer="1994" from-port="0" to-layer="1995" to-port="0" /> + <edge from-layer="1995" from-port="1" to-layer="1996" to-port="1" /> + <edge from-layer="1996" from-port="2" to-layer="1998" to-port="0" /> + <edge from-layer="1997" from-port="0" to-layer="1998" to-port="1" /> + <edge from-layer="1998" from-port="2" to-layer="2000" to-port="0" /> + <edge from-layer="1999" from-port="0" to-layer="2000" to-port="1" /> + <edge from-layer="2000" from-port="2" to-layer="2001" to-port="0" /> + <edge from-layer="2001" from-port="1" to-layer="2002" to-port="1" /> + <edge from-layer="2002" from-port="2" to-layer="2003" to-port="1" /> + <edge from-layer="2003" from-port="2" to-layer="2007" to-port="0" /> + <edge from-layer="2003" from-port="2" to-layer="2187" to-port="0" /> + <edge from-layer="2003" from-port="2" to-layer="2014" to-port="0" /> + <edge from-layer="2004" from-port="0" to-layer="2015" to-port="0" /> + <edge from-layer="2005" from-port="0" to-layer="2013" to-port="0" /> + <edge from-layer="2006" from-port="0" to-layer="2007" to-port="1" /> + <edge from-layer="2007" from-port="2" to-layer="2009" to-port="0" /> + <edge from-layer="2008" from-port="0" to-layer="2009" to-port="1" /> + <edge from-layer="2009" from-port="2" to-layer="2011" to-port="0" /> + <edge from-layer="2010" from-port="0" to-layer="2011" to-port="1" /> + <edge from-layer="2011" from-port="2" to-layer="2012" to-port="0" /> + <edge from-layer="2012" from-port="1" to-layer="2013" to-port="1" /> + <edge from-layer="2013" from-port="2" to-layer="2014" to-port="1" /> + <edge from-layer="2014" from-port="2" to-layer="2015" to-port="1" /> + <edge from-layer="2015" from-port="2" to-layer="2074" to-port="0" /> + <edge from-layer="2015" from-port="2" to-layer="2136" to-port="0" /> + <edge from-layer="2015" from-port="2" to-layer="2026" to-port="0" /> + <edge from-layer="2016" from-port="0" to-layer="2017" to-port="0" /> + <edge from-layer="2017" from-port="1" to-layer="2020" to-port="0" /> + <edge from-layer="2018" from-port="0" to-layer="2019" to-port="0" /> + <edge from-layer="2019" from-port="1" to-layer="2020" to-port="1" /> + <edge from-layer="2020" from-port="2" to-layer="2022" to-port="0" /> + <edge from-layer="2021" from-port="0" to-layer="2022" to-port="1" /> + <edge from-layer="2022" from-port="2" to-layer="2024" to-port="0" /> + <edge from-layer="2023" from-port="0" to-layer="2024" to-port="1" /> + <edge from-layer="2024" from-port="2" to-layer="2025" to-port="0" /> + <edge from-layer="2025" from-port="1" to-layer="2026" to-port="1" /> + <edge from-layer="2026" from-port="2" to-layer="2029" to-port="0" /> + <edge from-layer="2027" from-port="0" to-layer="2028" to-port="0" /> + <edge from-layer="2028" from-port="1" to-layer="2029" to-port="1" /> + <edge from-layer="2029" from-port="2" to-layer="2031" to-port="0" /> + <edge from-layer="2030" from-port="0" to-layer="2031" to-port="1" /> + <edge from-layer="2031" from-port="2" to-layer="2033" to-port="0" /> + <edge from-layer="2032" from-port="0" to-layer="2033" to-port="1" /> + <edge from-layer="2033" from-port="2" to-layer="2045" to-port="0" /> + <edge from-layer="2033" from-port="2" to-layer="2051" to-port="0" /> + <edge from-layer="2033" from-port="2" to-layer="2035" to-port="0" /> + <edge from-layer="2033" from-port="2" to-layer="2034" to-port="0" /> + <edge from-layer="2034" from-port="2" to-layer="2054" to-port="0" /> + <edge from-layer="2035" from-port="1" to-layer="2037" to-port="0" /> + <edge from-layer="2036" from-port="0" to-layer="2037" to-port="2" /> + <edge from-layer="2037" from-port="3" to-layer="2038" to-port="0" /> + <edge from-layer="2038" from-port="2" to-layer="2039" to-port="0" /> + <edge from-layer="2039" from-port="1" to-layer="2041" to-port="0" /> + <edge from-layer="2040" from-port="0" to-layer="2041" to-port="1" /> + <edge from-layer="2041" from-port="2" to-layer="2045" to-port="1" /> + <edge from-layer="2041" from-port="2" to-layer="2051" to-port="2" /> + <edge from-layer="2042" from-port="0" to-layer="2045" to-port="2" /> + <edge from-layer="2043" from-port="0" to-layer="2045" to-port="3" /> + <edge from-layer="2044" from-port="0" to-layer="2045" to-port="4" /> + <edge from-layer="2045" from-port="5" to-layer="2047" to-port="0" /> + <edge from-layer="2046" from-port="0" to-layer="2047" to-port="1" /> + <edge from-layer="2047" from-port="2" to-layer="2052" to-port="0" /> + <edge from-layer="2048" from-port="0" to-layer="2051" to-port="1" /> + <edge from-layer="2049" from-port="0" to-layer="2051" to-port="3" /> + <edge from-layer="2050" from-port="0" to-layer="2051" to-port="4" /> + <edge from-layer="2051" from-port="5" to-layer="2052" to-port="1" /> + <edge from-layer="2052" from-port="2" to-layer="2053" to-port="0" /> + <edge from-layer="2053" from-port="2" to-layer="2054" to-port="1" /> + <edge from-layer="2054" from-port="2" to-layer="2171" to-port="0" /> + <edge from-layer="2055" from-port="0" to-layer="2060" to-port="0" /> + <edge from-layer="2056" from-port="0" to-layer="2059" to-port="1" /> + <edge from-layer="2057" from-port="0" to-layer="2059" to-port="2" /> + <edge from-layer="2058" from-port="0" to-layer="2059" to-port="3" /> + <edge from-layer="2059" from-port="4" to-layer="2060" to-port="1" /> + <edge from-layer="2060" from-port="2" to-layer="2061" to-port="0" /> + <edge from-layer="2061" from-port="1" to-layer="2063" to-port="0" /> + <edge from-layer="2062" from-port="0" to-layer="2063" to-port="2" /> + <edge from-layer="2063" from-port="3" to-layer="2159" to-port="0" /> + <edge from-layer="2063" from-port="3" to-layer="2103" to-port="0" /> + <edge from-layer="2064" from-port="0" to-layer="2065" to-port="0" /> + <edge from-layer="2065" from-port="1" to-layer="2068" to-port="0" /> + <edge from-layer="2066" from-port="0" to-layer="2067" to-port="0" /> + <edge from-layer="2067" from-port="1" to-layer="2068" to-port="1" /> + <edge from-layer="2068" from-port="2" to-layer="2070" to-port="0" /> + <edge from-layer="2069" from-port="0" to-layer="2070" to-port="1" /> + <edge from-layer="2070" from-port="2" to-layer="2072" to-port="0" /> + <edge from-layer="2071" from-port="0" to-layer="2072" to-port="1" /> + <edge from-layer="2072" from-port="2" to-layer="2073" to-port="0" /> + <edge from-layer="2073" from-port="1" to-layer="2074" to-port="1" /> + <edge from-layer="2074" from-port="2" to-layer="2077" to-port="0" /> + <edge from-layer="2075" from-port="0" to-layer="2076" to-port="0" /> + <edge from-layer="2076" from-port="1" to-layer="2077" to-port="1" /> + <edge from-layer="2077" from-port="2" to-layer="2079" to-port="0" /> + <edge from-layer="2078" from-port="0" to-layer="2079" to-port="1" /> + <edge from-layer="2079" from-port="2" to-layer="2081" to-port="0" /> + <edge from-layer="2080" from-port="0" to-layer="2081" to-port="1" /> + <edge from-layer="2081" from-port="2" to-layer="2099" to-port="0" /> + <edge from-layer="2081" from-port="2" to-layer="2082" to-port="0" /> + <edge from-layer="2081" from-port="2" to-layer="2083" to-port="0" /> + <edge from-layer="2081" from-port="2" to-layer="2093" to-port="0" /> + <edge from-layer="2082" from-port="2" to-layer="2102" to-port="0" /> + <edge from-layer="2083" from-port="1" to-layer="2085" to-port="0" /> + <edge from-layer="2084" from-port="0" to-layer="2085" to-port="2" /> + <edge from-layer="2085" from-port="3" to-layer="2086" to-port="0" /> + <edge from-layer="2086" from-port="2" to-layer="2087" to-port="0" /> + <edge from-layer="2087" from-port="1" to-layer="2089" to-port="0" /> + <edge from-layer="2088" from-port="0" to-layer="2089" to-port="1" /> + <edge from-layer="2089" from-port="2" to-layer="2093" to-port="1" /> + <edge from-layer="2089" from-port="2" to-layer="2099" to-port="2" /> + <edge from-layer="2090" from-port="0" to-layer="2093" to-port="2" /> + <edge from-layer="2091" from-port="0" to-layer="2093" to-port="3" /> + <edge from-layer="2092" from-port="0" to-layer="2093" to-port="4" /> + <edge from-layer="2093" from-port="5" to-layer="2095" to-port="0" /> + <edge from-layer="2094" from-port="0" to-layer="2095" to-port="1" /> + <edge from-layer="2095" from-port="2" to-layer="2100" to-port="0" /> + <edge from-layer="2096" from-port="0" to-layer="2099" to-port="1" /> + <edge from-layer="2097" from-port="0" to-layer="2099" to-port="3" /> + <edge from-layer="2098" from-port="0" to-layer="2099" to-port="4" /> + <edge from-layer="2099" from-port="5" to-layer="2100" to-port="1" /> + <edge from-layer="2100" from-port="2" to-layer="2101" to-port="0" /> + <edge from-layer="2101" from-port="2" to-layer="2102" to-port="1" /> + <edge from-layer="2102" from-port="2" to-layer="2163" to-port="0" /> + <edge from-layer="2102" from-port="2" to-layer="2103" to-port="1" /> + <edge from-layer="2103" from-port="2" to-layer="2105" to-port="0" /> + <edge from-layer="2103" from-port="2" to-layer="2104" to-port="0" /> + <edge from-layer="2103" from-port="2" to-layer="2318" to-port="0" /> + <edge from-layer="2104" from-port="2" to-layer="2114" to-port="0" /> + <edge from-layer="2105" from-port="1" to-layer="2112" to-port="0" /> + <edge from-layer="2105" from-port="1" to-layer="2108" to-port="0" /> + <edge from-layer="2106" from-port="0" to-layer="2108" to-port="1" /> + <edge from-layer="2107" from-port="0" to-layer="2108" to-port="2" /> + <edge from-layer="2108" from-port="3" to-layer="2113" to-port="0" /> + <edge from-layer="2109" from-port="0" to-layer="2113" to-port="1" /> + <edge from-layer="2110" from-port="0" to-layer="2112" to-port="1" /> + <edge from-layer="2111" from-port="0" to-layer="2112" to-port="2" /> + <edge from-layer="2112" from-port="3" to-layer="2113" to-port="2" /> + <edge from-layer="2113" from-port="3" to-layer="2114" to-port="1" /> + <edge from-layer="2114" from-port="2" to-layer="2116" to-port="0" /> + <edge from-layer="2115" from-port="0" to-layer="2116" to-port="1" /> + <edge from-layer="2116" from-port="2" to-layer="2171" to-port="1" /> + <edge from-layer="2117" from-port="0" to-layer="2122" to-port="0" /> + <edge from-layer="2118" from-port="0" to-layer="2121" to-port="1" /> + <edge from-layer="2119" from-port="0" to-layer="2121" to-port="2" /> + <edge from-layer="2120" from-port="0" to-layer="2121" to-port="3" /> + <edge from-layer="2121" from-port="4" to-layer="2122" to-port="1" /> + <edge from-layer="2122" from-port="2" to-layer="2123" to-port="0" /> + <edge from-layer="2123" from-port="1" to-layer="2125" to-port="0" /> + <edge from-layer="2124" from-port="0" to-layer="2125" to-port="2" /> + <edge from-layer="2125" from-port="3" to-layer="2144" to-port="0" /> + <edge from-layer="2126" from-port="0" to-layer="2127" to-port="0" /> + <edge from-layer="2127" from-port="1" to-layer="2130" to-port="0" /> + <edge from-layer="2128" from-port="0" to-layer="2129" to-port="0" /> + <edge from-layer="2129" from-port="1" to-layer="2130" to-port="1" /> + <edge from-layer="2130" from-port="2" to-layer="2132" to-port="0" /> + <edge from-layer="2131" from-port="0" to-layer="2132" to-port="1" /> + <edge from-layer="2132" from-port="2" to-layer="2134" to-port="0" /> + <edge from-layer="2133" from-port="0" to-layer="2134" to-port="1" /> + <edge from-layer="2134" from-port="2" to-layer="2135" to-port="0" /> + <edge from-layer="2135" from-port="1" to-layer="2136" to-port="1" /> + <edge from-layer="2136" from-port="2" to-layer="2139" to-port="0" /> + <edge from-layer="2137" from-port="0" to-layer="2138" to-port="0" /> + <edge from-layer="2138" from-port="1" to-layer="2139" to-port="1" /> + <edge from-layer="2139" from-port="2" to-layer="2141" to-port="0" /> + <edge from-layer="2140" from-port="0" to-layer="2141" to-port="1" /> + <edge from-layer="2141" from-port="2" to-layer="2143" to-port="0" /> + <edge from-layer="2142" from-port="0" to-layer="2143" to-port="1" /> + <edge from-layer="2143" from-port="2" to-layer="2144" to-port="1" /> + <edge from-layer="2144" from-port="2" to-layer="2317" to-port="0" /> + <edge from-layer="2144" from-port="2" to-layer="2145" to-port="0" /> + <edge from-layer="2144" from-port="2" to-layer="2146" to-port="0" /> + <edge from-layer="2145" from-port="2" to-layer="2155" to-port="0" /> + <edge from-layer="2146" from-port="1" to-layer="2149" to-port="0" /> + <edge from-layer="2146" from-port="1" to-layer="2153" to-port="0" /> + <edge from-layer="2147" from-port="0" to-layer="2149" to-port="1" /> + <edge from-layer="2148" from-port="0" to-layer="2149" to-port="2" /> + <edge from-layer="2149" from-port="3" to-layer="2154" to-port="1" /> + <edge from-layer="2150" from-port="0" to-layer="2154" to-port="2" /> + <edge from-layer="2151" from-port="0" to-layer="2153" to-port="1" /> + <edge from-layer="2152" from-port="0" to-layer="2153" to-port="2" /> + <edge from-layer="2153" from-port="3" to-layer="2154" to-port="3" /> + <edge from-layer="2154" from-port="4" to-layer="2155" to-port="1" /> + <edge from-layer="2155" from-port="2" to-layer="2157" to-port="0" /> + <edge from-layer="2156" from-port="0" to-layer="2157" to-port="1" /> + <edge from-layer="2157" from-port="2" to-layer="2171" to-port="2" /> + <edge from-layer="2158" from-port="0" to-layer="2170" to-port="1" /> + <edge from-layer="2159" from-port="1" to-layer="2162" to-port="0" /> + <edge from-layer="2160" from-port="0" to-layer="2162" to-port="1" /> + <edge from-layer="2161" from-port="0" to-layer="2162" to-port="2" /> + <edge from-layer="2162" from-port="3" to-layer="2167" to-port="0" /> + <edge from-layer="2163" from-port="1" to-layer="2166" to-port="0" /> + <edge from-layer="2164" from-port="0" to-layer="2166" to-port="1" /> + <edge from-layer="2165" from-port="0" to-layer="2166" to-port="2" /> + <edge from-layer="2166" from-port="3" to-layer="2167" to-port="1" /> + <edge from-layer="2167" from-port="2" to-layer="2170" to-port="2" /> + <edge from-layer="2168" from-port="0" to-layer="2170" to-port="3" /> + <edge from-layer="2169" from-port="0" to-layer="2170" to-port="4" /> + <edge from-layer="2170" from-port="5" to-layer="2171" to-port="3" /> + <edge from-layer="2171" from-port="4" to-layer="2173" to-port="0" /> + <edge from-layer="2172" from-port="0" to-layer="2173" to-port="1" /> + <edge from-layer="2173" from-port="2" to-layer="2175" to-port="0" /> + <edge from-layer="2174" from-port="0" to-layer="2175" to-port="1" /> + <edge from-layer="2175" from-port="2" to-layer="2186" to-port="0" /> + <edge from-layer="2176" from-port="0" to-layer="2177" to-port="0" /> + <edge from-layer="2177" from-port="1" to-layer="2180" to-port="0" /> + <edge from-layer="2178" from-port="0" to-layer="2179" to-port="0" /> + <edge from-layer="2179" from-port="1" to-layer="2180" to-port="1" /> + <edge from-layer="2180" from-port="2" to-layer="2182" to-port="0" /> + <edge from-layer="2181" from-port="0" to-layer="2182" to-port="1" /> + <edge from-layer="2182" from-port="2" to-layer="2184" to-port="0" /> + <edge from-layer="2183" from-port="0" to-layer="2184" to-port="1" /> + <edge from-layer="2184" from-port="2" to-layer="2185" to-port="0" /> + <edge from-layer="2185" from-port="1" to-layer="2186" to-port="1" /> + <edge from-layer="2186" from-port="2" to-layer="2187" to-port="1" /> + <edge from-layer="2187" from-port="2" to-layer="2235" to-port="0" /> + <edge from-layer="2187" from-port="2" to-layer="2191" to-port="0" /> + <edge from-layer="2187" from-port="2" to-layer="2198" to-port="0" /> + <edge from-layer="2188" from-port="0" to-layer="2199" to-port="0" /> + <edge from-layer="2189" from-port="0" to-layer="2197" to-port="0" /> + <edge from-layer="2190" from-port="0" to-layer="2191" to-port="1" /> + <edge from-layer="2191" from-port="2" to-layer="2193" to-port="0" /> + <edge from-layer="2192" from-port="0" to-layer="2193" to-port="1" /> + <edge from-layer="2193" from-port="2" to-layer="2195" to-port="0" /> + <edge from-layer="2194" from-port="0" to-layer="2195" to-port="1" /> + <edge from-layer="2195" from-port="2" to-layer="2196" to-port="0" /> + <edge from-layer="2196" from-port="1" to-layer="2197" to-port="1" /> + <edge from-layer="2197" from-port="2" to-layer="2198" to-port="1" /> + <edge from-layer="2198" from-port="2" to-layer="2199" to-port="1" /> + <edge from-layer="2199" from-port="2" to-layer="2210" to-port="0" /> + <edge from-layer="2199" from-port="2" to-layer="2222" to-port="0" /> + <edge from-layer="2200" from-port="0" to-layer="2201" to-port="0" /> + <edge from-layer="2201" from-port="1" to-layer="2204" to-port="0" /> + <edge from-layer="2202" from-port="0" to-layer="2203" to-port="0" /> + <edge from-layer="2203" from-port="1" to-layer="2204" to-port="1" /> + <edge from-layer="2204" from-port="2" to-layer="2206" to-port="0" /> + <edge from-layer="2205" from-port="0" to-layer="2206" to-port="1" /> + <edge from-layer="2206" from-port="2" to-layer="2208" to-port="0" /> + <edge from-layer="2207" from-port="0" to-layer="2208" to-port="1" /> + <edge from-layer="2208" from-port="2" to-layer="2209" to-port="0" /> + <edge from-layer="2209" from-port="1" to-layer="2210" to-port="1" /> + <edge from-layer="2210" from-port="2" to-layer="2211" to-port="0" /> + <edge from-layer="2211" from-port="1" to-layer="2223" to-port="0" /> + <edge from-layer="2212" from-port="0" to-layer="2213" to-port="0" /> + <edge from-layer="2213" from-port="1" to-layer="2216" to-port="0" /> + <edge from-layer="2214" from-port="0" to-layer="2215" to-port="0" /> + <edge from-layer="2215" from-port="1" to-layer="2216" to-port="1" /> + <edge from-layer="2216" from-port="2" to-layer="2218" to-port="0" /> + <edge from-layer="2217" from-port="0" to-layer="2218" to-port="1" /> + <edge from-layer="2218" from-port="2" to-layer="2220" to-port="0" /> + <edge from-layer="2219" from-port="0" to-layer="2220" to-port="1" /> + <edge from-layer="2220" from-port="2" to-layer="2221" to-port="0" /> + <edge from-layer="2221" from-port="1" to-layer="2222" to-port="1" /> + <edge from-layer="2222" from-port="2" to-layer="2223" to-port="1" /> + <edge from-layer="2223" from-port="2" to-layer="2234" to-port="0" /> + <edge from-layer="2224" from-port="0" to-layer="2225" to-port="0" /> + <edge from-layer="2225" from-port="1" to-layer="2228" to-port="0" /> + <edge from-layer="2226" from-port="0" to-layer="2227" to-port="0" /> + <edge from-layer="2227" from-port="1" to-layer="2228" to-port="1" /> + <edge from-layer="2228" from-port="2" to-layer="2230" to-port="0" /> + <edge from-layer="2229" from-port="0" to-layer="2230" to-port="1" /> + <edge from-layer="2230" from-port="2" to-layer="2232" to-port="0" /> + <edge from-layer="2231" from-port="0" to-layer="2232" to-port="1" /> + <edge from-layer="2232" from-port="2" to-layer="2233" to-port="0" /> + <edge from-layer="2233" from-port="1" to-layer="2234" to-port="1" /> + <edge from-layer="2234" from-port="2" to-layer="2235" to-port="1" /> + <edge from-layer="2235" from-port="2" to-layer="2245" to-port="0" /> + <edge from-layer="2235" from-port="2" to-layer="2238" to-port="0" /> + <edge from-layer="2235" from-port="2" to-layer="2429" to-port="0" /> + <edge from-layer="2236" from-port="0" to-layer="2244" to-port="0" /> + <edge from-layer="2237" from-port="0" to-layer="2238" to-port="1" /> + <edge from-layer="2238" from-port="2" to-layer="2240" to-port="0" /> + <edge from-layer="2239" from-port="0" to-layer="2240" to-port="1" /> + <edge from-layer="2240" from-port="2" to-layer="2242" to-port="0" /> + <edge from-layer="2241" from-port="0" to-layer="2242" to-port="1" /> + <edge from-layer="2242" from-port="2" to-layer="2243" to-port="0" /> + <edge from-layer="2243" from-port="1" to-layer="2244" to-port="1" /> + <edge from-layer="2244" from-port="2" to-layer="2245" to-port="1" /> + <edge from-layer="2245" from-port="2" to-layer="2246" to-port="1" /> + <edge from-layer="2246" from-port="2" to-layer="2257" to-port="0" /> + <edge from-layer="2246" from-port="2" to-layer="2286" to-port="0" /> + <edge from-layer="2246" from-port="2" to-layer="2345" to-port="0" /> + <edge from-layer="2247" from-port="0" to-layer="2248" to-port="0" /> + <edge from-layer="2248" from-port="1" to-layer="2251" to-port="0" /> + <edge from-layer="2249" from-port="0" to-layer="2250" to-port="0" /> + <edge from-layer="2250" from-port="1" to-layer="2251" to-port="1" /> + <edge from-layer="2251" from-port="2" to-layer="2253" to-port="0" /> + <edge from-layer="2252" from-port="0" to-layer="2253" to-port="1" /> + <edge from-layer="2253" from-port="2" to-layer="2255" to-port="0" /> + <edge from-layer="2254" from-port="0" to-layer="2255" to-port="1" /> + <edge from-layer="2255" from-port="2" to-layer="2256" to-port="0" /> + <edge from-layer="2256" from-port="1" to-layer="2257" to-port="1" /> + <edge from-layer="2257" from-port="2" to-layer="2260" to-port="0" /> + <edge from-layer="2258" from-port="0" to-layer="2259" to-port="0" /> + <edge from-layer="2259" from-port="1" to-layer="2260" to-port="1" /> + <edge from-layer="2260" from-port="2" to-layer="2262" to-port="0" /> + <edge from-layer="2261" from-port="0" to-layer="2262" to-port="1" /> + <edge from-layer="2262" from-port="2" to-layer="2264" to-port="0" /> + <edge from-layer="2263" from-port="0" to-layer="2264" to-port="1" /> + <edge from-layer="2264" from-port="2" to-layer="2265" to-port="1" /> + <edge from-layer="2265" from-port="2" to-layer="2387" to-port="0" /> + <edge from-layer="2265" from-port="2" to-layer="2266" to-port="0" /> + <edge from-layer="2265" from-port="2" to-layer="2388" to-port="0" /> + <edge from-layer="2267" from-port="0" to-layer="2272" to-port="0" /> + <edge from-layer="2268" from-port="0" to-layer="2271" to-port="1" /> + <edge from-layer="2269" from-port="0" to-layer="2271" to-port="2" /> + <edge from-layer="2270" from-port="0" to-layer="2271" to-port="3" /> + <edge from-layer="2271" from-port="4" to-layer="2272" to-port="1" /> + <edge from-layer="2272" from-port="2" to-layer="2273" to-port="0" /> + <edge from-layer="2273" from-port="1" to-layer="2275" to-port="0" /> + <edge from-layer="2274" from-port="0" to-layer="2275" to-port="2" /> + <edge from-layer="2275" from-port="3" to-layer="2315" to-port="0" /> + <edge from-layer="2275" from-port="3" to-layer="2401" to-port="0" /> + <edge from-layer="2276" from-port="0" to-layer="2277" to-port="0" /> + <edge from-layer="2277" from-port="1" to-layer="2280" to-port="0" /> + <edge from-layer="2278" from-port="0" to-layer="2279" to-port="0" /> + <edge from-layer="2279" from-port="1" to-layer="2280" to-port="1" /> + <edge from-layer="2280" from-port="2" to-layer="2282" to-port="0" /> + <edge from-layer="2281" from-port="0" to-layer="2282" to-port="1" /> + <edge from-layer="2282" from-port="2" to-layer="2284" to-port="0" /> + <edge from-layer="2283" from-port="0" to-layer="2284" to-port="1" /> + <edge from-layer="2284" from-port="2" to-layer="2285" to-port="0" /> + <edge from-layer="2285" from-port="1" to-layer="2286" to-port="1" /> + <edge from-layer="2286" from-port="2" to-layer="2289" to-port="0" /> + <edge from-layer="2287" from-port="0" to-layer="2288" to-port="0" /> + <edge from-layer="2288" from-port="1" to-layer="2289" to-port="1" /> + <edge from-layer="2289" from-port="2" to-layer="2291" to-port="0" /> + <edge from-layer="2290" from-port="0" to-layer="2291" to-port="1" /> + <edge from-layer="2291" from-port="2" to-layer="2293" to-port="0" /> + <edge from-layer="2292" from-port="0" to-layer="2293" to-port="1" /> + <edge from-layer="2293" from-port="2" to-layer="2305" to-port="0" /> + <edge from-layer="2293" from-port="2" to-layer="2311" to-port="0" /> + <edge from-layer="2293" from-port="2" to-layer="2295" to-port="0" /> + <edge from-layer="2293" from-port="2" to-layer="2294" to-port="0" /> + <edge from-layer="2294" from-port="2" to-layer="2314" to-port="0" /> + <edge from-layer="2295" from-port="1" to-layer="2297" to-port="0" /> + <edge from-layer="2296" from-port="0" to-layer="2297" to-port="2" /> + <edge from-layer="2297" from-port="3" to-layer="2298" to-port="0" /> + <edge from-layer="2298" from-port="2" to-layer="2299" to-port="0" /> + <edge from-layer="2299" from-port="1" to-layer="2301" to-port="0" /> + <edge from-layer="2300" from-port="0" to-layer="2301" to-port="1" /> + <edge from-layer="2301" from-port="2" to-layer="2311" to-port="2" /> + <edge from-layer="2301" from-port="2" to-layer="2305" to-port="1" /> + <edge from-layer="2302" from-port="0" to-layer="2305" to-port="2" /> + <edge from-layer="2303" from-port="0" to-layer="2305" to-port="3" /> + <edge from-layer="2304" from-port="0" to-layer="2305" to-port="4" /> + <edge from-layer="2305" from-port="5" to-layer="2307" to-port="0" /> + <edge from-layer="2306" from-port="0" to-layer="2307" to-port="1" /> + <edge from-layer="2307" from-port="2" to-layer="2312" to-port="0" /> + <edge from-layer="2308" from-port="0" to-layer="2311" to-port="1" /> + <edge from-layer="2309" from-port="0" to-layer="2311" to-port="3" /> + <edge from-layer="2310" from-port="0" to-layer="2311" to-port="4" /> + <edge from-layer="2311" from-port="5" to-layer="2312" to-port="1" /> + <edge from-layer="2312" from-port="2" to-layer="2313" to-port="0" /> + <edge from-layer="2313" from-port="2" to-layer="2314" to-port="1" /> + <edge from-layer="2314" from-port="2" to-layer="2315" to-port="1" /> + <edge from-layer="2314" from-port="2" to-layer="2405" to-port="0" /> + <edge from-layer="2315" from-port="2" to-layer="2375" to-port="0" /> + <edge from-layer="2315" from-port="2" to-layer="2374" to-port="0" /> + <edge from-layer="2315" from-port="2" to-layer="2316" to-port="0" /> + <edge from-layer="2325" from-port="0" to-layer="2330" to-port="0" /> + <edge from-layer="2326" from-port="0" to-layer="2329" to-port="1" /> + <edge from-layer="2327" from-port="0" to-layer="2329" to-port="2" /> + <edge from-layer="2328" from-port="0" to-layer="2329" to-port="3" /> + <edge from-layer="2329" from-port="4" to-layer="2330" to-port="1" /> + <edge from-layer="2330" from-port="2" to-layer="2331" to-port="0" /> + <edge from-layer="2331" from-port="1" to-layer="2333" to-port="0" /> + <edge from-layer="2332" from-port="0" to-layer="2333" to-port="2" /> + <edge from-layer="2333" from-port="3" to-layer="11091" to-port="0" /> + <edge from-layer="2334" from-port="0" to-layer="11072" to-port="0" /> + <edge from-layer="2335" from-port="0" to-layer="2336" to-port="0" /> + <edge from-layer="2336" from-port="1" to-layer="2339" to-port="0" /> + <edge from-layer="2337" from-port="0" to-layer="2338" to-port="0" /> + <edge from-layer="2338" from-port="1" to-layer="2339" to-port="1" /> + <edge from-layer="2339" from-port="2" to-layer="2341" to-port="0" /> + <edge from-layer="2340" from-port="0" to-layer="2341" to-port="1" /> + <edge from-layer="2341" from-port="2" to-layer="2343" to-port="0" /> + <edge from-layer="2342" from-port="0" to-layer="2343" to-port="1" /> + <edge from-layer="2343" from-port="2" to-layer="2344" to-port="0" /> + <edge from-layer="2344" from-port="1" to-layer="2345" to-port="1" /> + <edge from-layer="2345" from-port="2" to-layer="2348" to-port="0" /> + <edge from-layer="2346" from-port="0" to-layer="2347" to-port="0" /> + <edge from-layer="2347" from-port="1" to-layer="2348" to-port="1" /> + <edge from-layer="2348" from-port="2" to-layer="2350" to-port="0" /> + <edge from-layer="2349" from-port="0" to-layer="2350" to-port="1" /> + <edge from-layer="2350" from-port="2" to-layer="2352" to-port="0" /> + <edge from-layer="2351" from-port="0" to-layer="2352" to-port="1" /> + <edge from-layer="2352" from-port="2" to-layer="2353" to-port="0" /> + <edge from-layer="2352" from-port="2" to-layer="2354" to-port="0" /> + <edge from-layer="2352" from-port="2" to-layer="2370" to-port="0" /> + <edge from-layer="2352" from-port="2" to-layer="2364" to-port="0" /> + <edge from-layer="2353" from-port="2" to-layer="2373" to-port="0" /> + <edge from-layer="2354" from-port="1" to-layer="2356" to-port="0" /> + <edge from-layer="2355" from-port="0" to-layer="2356" to-port="2" /> + <edge from-layer="2356" from-port="3" to-layer="2357" to-port="0" /> + <edge from-layer="2357" from-port="2" to-layer="2358" to-port="0" /> + <edge from-layer="2358" from-port="1" to-layer="2360" to-port="0" /> + <edge from-layer="2359" from-port="0" to-layer="2360" to-port="1" /> + <edge from-layer="2360" from-port="2" to-layer="2364" to-port="1" /> + <edge from-layer="2360" from-port="2" to-layer="2370" to-port="2" /> + <edge from-layer="2361" from-port="0" to-layer="2364" to-port="2" /> + <edge from-layer="2362" from-port="0" to-layer="2364" to-port="3" /> + <edge from-layer="2363" from-port="0" to-layer="2364" to-port="4" /> + <edge from-layer="2364" from-port="5" to-layer="2366" to-port="0" /> + <edge from-layer="2365" from-port="0" to-layer="2366" to-port="1" /> + <edge from-layer="2366" from-port="2" to-layer="2371" to-port="0" /> + <edge from-layer="2367" from-port="0" to-layer="2370" to-port="1" /> + <edge from-layer="2368" from-port="0" to-layer="2370" to-port="3" /> + <edge from-layer="2369" from-port="0" to-layer="2370" to-port="4" /> + <edge from-layer="2370" from-port="5" to-layer="2371" to-port="1" /> + <edge from-layer="2371" from-port="2" to-layer="2372" to-port="0" /> + <edge from-layer="2372" from-port="2" to-layer="2373" to-port="1" /> + <edge from-layer="2373" from-port="2" to-layer="2413" to-port="0" /> + <edge from-layer="2374" from-port="2" to-layer="2384" to-port="0" /> + <edge from-layer="2375" from-port="1" to-layer="2382" to-port="0" /> + <edge from-layer="2375" from-port="1" to-layer="2378" to-port="0" /> + <edge from-layer="2376" from-port="0" to-layer="2378" to-port="1" /> + <edge from-layer="2377" from-port="0" to-layer="2378" to-port="2" /> + <edge from-layer="2378" from-port="3" to-layer="2383" to-port="0" /> + <edge from-layer="2379" from-port="0" to-layer="2383" to-port="1" /> + <edge from-layer="2380" from-port="0" to-layer="2382" to-port="1" /> + <edge from-layer="2381" from-port="0" to-layer="2382" to-port="2" /> + <edge from-layer="2382" from-port="3" to-layer="2383" to-port="2" /> + <edge from-layer="2383" from-port="3" to-layer="2384" to-port="1" /> + <edge from-layer="2384" from-port="2" to-layer="2386" to-port="0" /> + <edge from-layer="2385" from-port="0" to-layer="2386" to-port="1" /> + <edge from-layer="2386" from-port="2" to-layer="2413" to-port="1" /> + <edge from-layer="2387" from-port="2" to-layer="2397" to-port="0" /> + <edge from-layer="2388" from-port="1" to-layer="2395" to-port="0" /> + <edge from-layer="2388" from-port="1" to-layer="2391" to-port="0" /> + <edge from-layer="2389" from-port="0" to-layer="2391" to-port="1" /> + <edge from-layer="2390" from-port="0" to-layer="2391" to-port="2" /> + <edge from-layer="2391" from-port="3" to-layer="2396" to-port="1" /> + <edge from-layer="2392" from-port="0" to-layer="2396" to-port="2" /> + <edge from-layer="2393" from-port="0" to-layer="2395" to-port="1" /> + <edge from-layer="2394" from-port="0" to-layer="2395" to-port="2" /> + <edge from-layer="2395" from-port="3" to-layer="2396" to-port="3" /> + <edge from-layer="2396" from-port="4" to-layer="2397" to-port="1" /> + <edge from-layer="2397" from-port="2" to-layer="2399" to-port="0" /> + <edge from-layer="2398" from-port="0" to-layer="2399" to-port="1" /> + <edge from-layer="2399" from-port="2" to-layer="2413" to-port="2" /> + <edge from-layer="2400" from-port="0" to-layer="2412" to-port="1" /> + <edge from-layer="2401" from-port="1" to-layer="2404" to-port="0" /> + <edge from-layer="2402" from-port="0" to-layer="2404" to-port="1" /> + <edge from-layer="2403" from-port="0" to-layer="2404" to-port="2" /> + <edge from-layer="2404" from-port="3" to-layer="2409" to-port="0" /> + <edge from-layer="2405" from-port="1" to-layer="2408" to-port="0" /> + <edge from-layer="2406" from-port="0" to-layer="2408" to-port="1" /> + <edge from-layer="2407" from-port="0" to-layer="2408" to-port="2" /> + <edge from-layer="2408" from-port="3" to-layer="2409" to-port="1" /> + <edge from-layer="2409" from-port="2" to-layer="2412" to-port="2" /> + <edge from-layer="2410" from-port="0" to-layer="2412" to-port="3" /> + <edge from-layer="2411" from-port="0" to-layer="2412" to-port="4" /> + <edge from-layer="2412" from-port="5" to-layer="2413" to-port="3" /> + <edge from-layer="2413" from-port="4" to-layer="2415" to-port="0" /> + <edge from-layer="2414" from-port="0" to-layer="2415" to-port="1" /> + <edge from-layer="2415" from-port="2" to-layer="2417" to-port="0" /> + <edge from-layer="2416" from-port="0" to-layer="2417" to-port="1" /> + <edge from-layer="2417" from-port="2" to-layer="2428" to-port="0" /> + <edge from-layer="2418" from-port="0" to-layer="2419" to-port="0" /> + <edge from-layer="2419" from-port="1" to-layer="2422" to-port="0" /> + <edge from-layer="2420" from-port="0" to-layer="2421" to-port="0" /> + <edge from-layer="2421" from-port="1" to-layer="2422" to-port="1" /> + <edge from-layer="2422" from-port="2" to-layer="2424" to-port="0" /> + <edge from-layer="2423" from-port="0" to-layer="2424" to-port="1" /> + <edge from-layer="2424" from-port="2" to-layer="2426" to-port="0" /> + <edge from-layer="2425" from-port="0" to-layer="2426" to-port="1" /> + <edge from-layer="2426" from-port="2" to-layer="2427" to-port="0" /> + <edge from-layer="2427" from-port="1" to-layer="2428" to-port="1" /> + <edge from-layer="2428" from-port="2" to-layer="2429" to-port="1" /> + <edge from-layer="2429" from-port="2" to-layer="2477" to-port="0" /> + <edge from-layer="2429" from-port="2" to-layer="2433" to-port="0" /> + <edge from-layer="2429" from-port="2" to-layer="2440" to-port="0" /> + <edge from-layer="2430" from-port="0" to-layer="2441" to-port="0" /> + <edge from-layer="2431" from-port="0" to-layer="2439" to-port="0" /> + <edge from-layer="2432" from-port="0" to-layer="2433" to-port="1" /> + <edge from-layer="2433" from-port="2" to-layer="2435" to-port="0" /> + <edge from-layer="2434" from-port="0" to-layer="2435" to-port="1" /> + <edge from-layer="2435" from-port="2" to-layer="2437" to-port="0" /> + <edge from-layer="2436" from-port="0" to-layer="2437" to-port="1" /> + <edge from-layer="2437" from-port="2" to-layer="2438" to-port="0" /> + <edge from-layer="2438" from-port="1" to-layer="2439" to-port="1" /> + <edge from-layer="2439" from-port="2" to-layer="2440" to-port="1" /> + <edge from-layer="2440" from-port="2" to-layer="2441" to-port="1" /> + <edge from-layer="2441" from-port="2" to-layer="2452" to-port="0" /> + <edge from-layer="2441" from-port="2" to-layer="2464" to-port="0" /> + <edge from-layer="2442" from-port="0" to-layer="2443" to-port="0" /> + <edge from-layer="2443" from-port="1" to-layer="2446" to-port="0" /> + <edge from-layer="2444" from-port="0" to-layer="2445" to-port="0" /> + <edge from-layer="2445" from-port="1" to-layer="2446" to-port="1" /> + <edge from-layer="2446" from-port="2" to-layer="2448" to-port="0" /> + <edge from-layer="2447" from-port="0" to-layer="2448" to-port="1" /> + <edge from-layer="2448" from-port="2" to-layer="2450" to-port="0" /> + <edge from-layer="2449" from-port="0" to-layer="2450" to-port="1" /> + <edge from-layer="2450" from-port="2" to-layer="2451" to-port="0" /> + <edge from-layer="2451" from-port="1" to-layer="2452" to-port="1" /> + <edge from-layer="2452" from-port="2" to-layer="2453" to-port="0" /> + <edge from-layer="2453" from-port="1" to-layer="2465" to-port="0" /> + <edge from-layer="2454" from-port="0" to-layer="2455" to-port="0" /> + <edge from-layer="2455" from-port="1" to-layer="2458" to-port="0" /> + <edge from-layer="2456" from-port="0" to-layer="2457" to-port="0" /> + <edge from-layer="2457" from-port="1" to-layer="2458" to-port="1" /> + <edge from-layer="2458" from-port="2" to-layer="2460" to-port="0" /> + <edge from-layer="2459" from-port="0" to-layer="2460" to-port="1" /> + <edge from-layer="2460" from-port="2" to-layer="2462" to-port="0" /> + <edge from-layer="2461" from-port="0" to-layer="2462" to-port="1" /> + <edge from-layer="2462" from-port="2" to-layer="2463" to-port="0" /> + <edge from-layer="2463" from-port="1" to-layer="2464" to-port="1" /> + <edge from-layer="2464" from-port="2" to-layer="2465" to-port="1" /> + <edge from-layer="2465" from-port="2" to-layer="2476" to-port="0" /> + <edge from-layer="2466" from-port="0" to-layer="2467" to-port="0" /> + <edge from-layer="2467" from-port="1" to-layer="2470" to-port="0" /> + <edge from-layer="2468" from-port="0" to-layer="2469" to-port="0" /> + <edge from-layer="2469" from-port="1" to-layer="2470" to-port="1" /> + <edge from-layer="2470" from-port="2" to-layer="2472" to-port="0" /> + <edge from-layer="2471" from-port="0" to-layer="2472" to-port="1" /> + <edge from-layer="2472" from-port="2" to-layer="2474" to-port="0" /> + <edge from-layer="2473" from-port="0" to-layer="2474" to-port="1" /> + <edge from-layer="2474" from-port="2" to-layer="2475" to-port="0" /> + <edge from-layer="2475" from-port="1" to-layer="2476" to-port="1" /> + <edge from-layer="2476" from-port="2" to-layer="2477" to-port="1" /> + <edge from-layer="2477" from-port="2" to-layer="2481" to-port="0" /> + <edge from-layer="2477" from-port="2" to-layer="2661" to-port="0" /> + <edge from-layer="2477" from-port="2" to-layer="2488" to-port="0" /> + <edge from-layer="2478" from-port="0" to-layer="2489" to-port="0" /> + <edge from-layer="2479" from-port="0" to-layer="2487" to-port="0" /> + <edge from-layer="2480" from-port="0" to-layer="2481" to-port="1" /> + <edge from-layer="2481" from-port="2" to-layer="2483" to-port="0" /> + <edge from-layer="2482" from-port="0" to-layer="2483" to-port="1" /> + <edge from-layer="2483" from-port="2" to-layer="2485" to-port="0" /> + <edge from-layer="2484" from-port="0" to-layer="2485" to-port="1" /> + <edge from-layer="2485" from-port="2" to-layer="2486" to-port="0" /> + <edge from-layer="2486" from-port="1" to-layer="2487" to-port="1" /> + <edge from-layer="2487" from-port="2" to-layer="2488" to-port="1" /> + <edge from-layer="2488" from-port="2" to-layer="2489" to-port="1" /> + <edge from-layer="2489" from-port="2" to-layer="2610" to-port="0" /> + <edge from-layer="2489" from-port="2" to-layer="2548" to-port="0" /> + <edge from-layer="2489" from-port="2" to-layer="2500" to-port="0" /> + <edge from-layer="2490" from-port="0" to-layer="2491" to-port="0" /> + <edge from-layer="2491" from-port="1" to-layer="2494" to-port="0" /> + <edge from-layer="2492" from-port="0" to-layer="2493" to-port="0" /> + <edge from-layer="2493" from-port="1" to-layer="2494" to-port="1" /> + <edge from-layer="2494" from-port="2" to-layer="2496" to-port="0" /> + <edge from-layer="2495" from-port="0" to-layer="2496" to-port="1" /> + <edge from-layer="2496" from-port="2" to-layer="2498" to-port="0" /> + <edge from-layer="2497" from-port="0" to-layer="2498" to-port="1" /> + <edge from-layer="2498" from-port="2" to-layer="2499" to-port="0" /> + <edge from-layer="2499" from-port="1" to-layer="2500" to-port="1" /> + <edge from-layer="2500" from-port="2" to-layer="2503" to-port="0" /> + <edge from-layer="2501" from-port="0" to-layer="2502" to-port="0" /> + <edge from-layer="2502" from-port="1" to-layer="2503" to-port="1" /> + <edge from-layer="2503" from-port="2" to-layer="2505" to-port="0" /> + <edge from-layer="2504" from-port="0" to-layer="2505" to-port="1" /> + <edge from-layer="2505" from-port="2" to-layer="2507" to-port="0" /> + <edge from-layer="2506" from-port="0" to-layer="2507" to-port="1" /> + <edge from-layer="2507" from-port="2" to-layer="2508" to-port="0" /> + <edge from-layer="2507" from-port="2" to-layer="2509" to-port="0" /> + <edge from-layer="2507" from-port="2" to-layer="2525" to-port="0" /> + <edge from-layer="2507" from-port="2" to-layer="2519" to-port="0" /> + <edge from-layer="2508" from-port="2" to-layer="2528" to-port="0" /> + <edge from-layer="2509" from-port="1" to-layer="2511" to-port="0" /> + <edge from-layer="2510" from-port="0" to-layer="2511" to-port="2" /> + <edge from-layer="2511" from-port="3" to-layer="2512" to-port="0" /> + <edge from-layer="2512" from-port="2" to-layer="2513" to-port="0" /> + <edge from-layer="2513" from-port="1" to-layer="2515" to-port="0" /> + <edge from-layer="2514" from-port="0" to-layer="2515" to-port="1" /> + <edge from-layer="2515" from-port="2" to-layer="2519" to-port="1" /> + <edge from-layer="2515" from-port="2" to-layer="2525" to-port="2" /> + <edge from-layer="2516" from-port="0" to-layer="2519" to-port="2" /> + <edge from-layer="2517" from-port="0" to-layer="2519" to-port="3" /> + <edge from-layer="2518" from-port="0" to-layer="2519" to-port="4" /> + <edge from-layer="2519" from-port="5" to-layer="2521" to-port="0" /> + <edge from-layer="2520" from-port="0" to-layer="2521" to-port="1" /> + <edge from-layer="2521" from-port="2" to-layer="2526" to-port="0" /> + <edge from-layer="2522" from-port="0" to-layer="2525" to-port="1" /> + <edge from-layer="2523" from-port="0" to-layer="2525" to-port="3" /> + <edge from-layer="2524" from-port="0" to-layer="2525" to-port="4" /> + <edge from-layer="2525" from-port="5" to-layer="2526" to-port="1" /> + <edge from-layer="2526" from-port="2" to-layer="2527" to-port="0" /> + <edge from-layer="2527" from-port="2" to-layer="2528" to-port="1" /> + <edge from-layer="2528" from-port="2" to-layer="2645" to-port="0" /> + <edge from-layer="2529" from-port="0" to-layer="2534" to-port="0" /> + <edge from-layer="2530" from-port="0" to-layer="2533" to-port="1" /> + <edge from-layer="2531" from-port="0" to-layer="2533" to-port="2" /> + <edge from-layer="2532" from-port="0" to-layer="2533" to-port="3" /> + <edge from-layer="2533" from-port="4" to-layer="2534" to-port="1" /> + <edge from-layer="2534" from-port="2" to-layer="2535" to-port="0" /> + <edge from-layer="2535" from-port="1" to-layer="2537" to-port="0" /> + <edge from-layer="2536" from-port="0" to-layer="2537" to-port="2" /> + <edge from-layer="2537" from-port="3" to-layer="2577" to-port="0" /> + <edge from-layer="2537" from-port="3" to-layer="2633" to-port="0" /> + <edge from-layer="2538" from-port="0" to-layer="2539" to-port="0" /> + <edge from-layer="2539" from-port="1" to-layer="2542" to-port="0" /> + <edge from-layer="2540" from-port="0" to-layer="2541" to-port="0" /> + <edge from-layer="2541" from-port="1" to-layer="2542" to-port="1" /> + <edge from-layer="2542" from-port="2" to-layer="2544" to-port="0" /> + <edge from-layer="2543" from-port="0" to-layer="2544" to-port="1" /> + <edge from-layer="2544" from-port="2" to-layer="2546" to-port="0" /> + <edge from-layer="2545" from-port="0" to-layer="2546" to-port="1" /> + <edge from-layer="2546" from-port="2" to-layer="2547" to-port="0" /> + <edge from-layer="2547" from-port="1" to-layer="2548" to-port="1" /> + <edge from-layer="2548" from-port="2" to-layer="2551" to-port="0" /> + <edge from-layer="2549" from-port="0" to-layer="2550" to-port="0" /> + <edge from-layer="2550" from-port="1" to-layer="2551" to-port="1" /> + <edge from-layer="2551" from-port="2" to-layer="2553" to-port="0" /> + <edge from-layer="2552" from-port="0" to-layer="2553" to-port="1" /> + <edge from-layer="2553" from-port="2" to-layer="2555" to-port="0" /> + <edge from-layer="2554" from-port="0" to-layer="2555" to-port="1" /> + <edge from-layer="2555" from-port="2" to-layer="2573" to-port="0" /> + <edge from-layer="2555" from-port="2" to-layer="2567" to-port="0" /> + <edge from-layer="2555" from-port="2" to-layer="2557" to-port="0" /> + <edge from-layer="2555" from-port="2" to-layer="2556" to-port="0" /> + <edge from-layer="2556" from-port="2" to-layer="2576" to-port="0" /> + <edge from-layer="2557" from-port="1" to-layer="2559" to-port="0" /> + <edge from-layer="2558" from-port="0" to-layer="2559" to-port="2" /> + <edge from-layer="2559" from-port="3" to-layer="2560" to-port="0" /> + <edge from-layer="2560" from-port="2" to-layer="2561" to-port="0" /> + <edge from-layer="2561" from-port="1" to-layer="2563" to-port="0" /> + <edge from-layer="2562" from-port="0" to-layer="2563" to-port="1" /> + <edge from-layer="2563" from-port="2" to-layer="2567" to-port="1" /> + <edge from-layer="2563" from-port="2" to-layer="2573" to-port="2" /> + <edge from-layer="2564" from-port="0" to-layer="2567" to-port="2" /> + <edge from-layer="2565" from-port="0" to-layer="2567" to-port="3" /> + <edge from-layer="2566" from-port="0" to-layer="2567" to-port="4" /> + <edge from-layer="2567" from-port="5" to-layer="2569" to-port="0" /> + <edge from-layer="2568" from-port="0" to-layer="2569" to-port="1" /> + <edge from-layer="2569" from-port="2" to-layer="2574" to-port="0" /> + <edge from-layer="2570" from-port="0" to-layer="2573" to-port="1" /> + <edge from-layer="2571" from-port="0" to-layer="2573" to-port="3" /> + <edge from-layer="2572" from-port="0" to-layer="2573" to-port="4" /> + <edge from-layer="2573" from-port="5" to-layer="2574" to-port="1" /> + <edge from-layer="2574" from-port="2" to-layer="2575" to-port="0" /> + <edge from-layer="2575" from-port="2" to-layer="2576" to-port="1" /> + <edge from-layer="2576" from-port="2" to-layer="2577" to-port="1" /> + <edge from-layer="2576" from-port="2" to-layer="2637" to-port="0" /> + <edge from-layer="2577" from-port="2" to-layer="2578" to-port="0" /> + <edge from-layer="2577" from-port="2" to-layer="2579" to-port="0" /> + <edge from-layer="2577" from-port="2" to-layer="11222" to-port="0" /> + <edge from-layer="2578" from-port="2" to-layer="2588" to-port="0" /> + <edge from-layer="2579" from-port="1" to-layer="2582" to-port="0" /> + <edge from-layer="2579" from-port="1" to-layer="2586" to-port="0" /> + <edge from-layer="2580" from-port="0" to-layer="2582" to-port="1" /> + <edge from-layer="2581" from-port="0" to-layer="2582" to-port="2" /> + <edge from-layer="2582" from-port="3" to-layer="2587" to-port="0" /> + <edge from-layer="2583" from-port="0" to-layer="2587" to-port="1" /> + <edge from-layer="2584" from-port="0" to-layer="2586" to-port="1" /> + <edge from-layer="2585" from-port="0" to-layer="2586" to-port="2" /> + <edge from-layer="2586" from-port="3" to-layer="2587" to-port="2" /> + <edge from-layer="2587" from-port="3" to-layer="2588" to-port="1" /> + <edge from-layer="2588" from-port="2" to-layer="2590" to-port="0" /> + <edge from-layer="2589" from-port="0" to-layer="2590" to-port="1" /> + <edge from-layer="2590" from-port="2" to-layer="2645" to-port="1" /> + <edge from-layer="2591" from-port="0" to-layer="2596" to-port="0" /> + <edge from-layer="2592" from-port="0" to-layer="2595" to-port="1" /> + <edge from-layer="2593" from-port="0" to-layer="2595" to-port="2" /> + <edge from-layer="2594" from-port="0" to-layer="2595" to-port="3" /> + <edge from-layer="2595" from-port="4" to-layer="2596" to-port="1" /> + <edge from-layer="2596" from-port="2" to-layer="2597" to-port="0" /> + <edge from-layer="2597" from-port="1" to-layer="2599" to-port="0" /> + <edge from-layer="2598" from-port="0" to-layer="2599" to-port="2" /> + <edge from-layer="2599" from-port="3" to-layer="2618" to-port="0" /> + <edge from-layer="2600" from-port="0" to-layer="2601" to-port="0" /> + <edge from-layer="2601" from-port="1" to-layer="2604" to-port="0" /> + <edge from-layer="2602" from-port="0" to-layer="2603" to-port="0" /> + <edge from-layer="2603" from-port="1" to-layer="2604" to-port="1" /> + <edge from-layer="2604" from-port="2" to-layer="2606" to-port="0" /> + <edge from-layer="2605" from-port="0" to-layer="2606" to-port="1" /> + <edge from-layer="2606" from-port="2" to-layer="2608" to-port="0" /> + <edge from-layer="2607" from-port="0" to-layer="2608" to-port="1" /> + <edge from-layer="2608" from-port="2" to-layer="2609" to-port="0" /> + <edge from-layer="2609" from-port="1" to-layer="2610" to-port="1" /> + <edge from-layer="2610" from-port="2" to-layer="2613" to-port="0" /> + <edge from-layer="2611" from-port="0" to-layer="2612" to-port="0" /> + <edge from-layer="2612" from-port="1" to-layer="2613" to-port="1" /> + <edge from-layer="2613" from-port="2" to-layer="2615" to-port="0" /> + <edge from-layer="2614" from-port="0" to-layer="2615" to-port="1" /> + <edge from-layer="2615" from-port="2" to-layer="2617" to-port="0" /> + <edge from-layer="2616" from-port="0" to-layer="2617" to-port="1" /> + <edge from-layer="2617" from-port="2" to-layer="2618" to-port="1" /> + <edge from-layer="2618" from-port="2" to-layer="11221" to-port="0" /> + <edge from-layer="2618" from-port="2" to-layer="2619" to-port="0" /> + <edge from-layer="2618" from-port="2" to-layer="2620" to-port="0" /> + <edge from-layer="2619" from-port="2" to-layer="2629" to-port="0" /> + <edge from-layer="2620" from-port="1" to-layer="2623" to-port="0" /> + <edge from-layer="2620" from-port="1" to-layer="2627" to-port="0" /> + <edge from-layer="2621" from-port="0" to-layer="2623" to-port="1" /> + <edge from-layer="2622" from-port="0" to-layer="2623" to-port="2" /> + <edge from-layer="2623" from-port="3" to-layer="2628" to-port="1" /> + <edge from-layer="2624" from-port="0" to-layer="2628" to-port="2" /> + <edge from-layer="2625" from-port="0" to-layer="2627" to-port="1" /> + <edge from-layer="2626" from-port="0" to-layer="2627" to-port="2" /> + <edge from-layer="2627" from-port="3" to-layer="2628" to-port="3" /> + <edge from-layer="2628" from-port="4" to-layer="2629" to-port="1" /> + <edge from-layer="2629" from-port="2" to-layer="2631" to-port="0" /> + <edge from-layer="2630" from-port="0" to-layer="2631" to-port="1" /> + <edge from-layer="2631" from-port="2" to-layer="2645" to-port="2" /> + <edge from-layer="2632" from-port="0" to-layer="2644" to-port="1" /> + <edge from-layer="2633" from-port="1" to-layer="2636" to-port="0" /> + <edge from-layer="2634" from-port="0" to-layer="2636" to-port="1" /> + <edge from-layer="2635" from-port="0" to-layer="2636" to-port="2" /> + <edge from-layer="2636" from-port="3" to-layer="2641" to-port="0" /> + <edge from-layer="2637" from-port="1" to-layer="2640" to-port="0" /> + <edge from-layer="2638" from-port="0" to-layer="2640" to-port="1" /> + <edge from-layer="2639" from-port="0" to-layer="2640" to-port="2" /> + <edge from-layer="2640" from-port="3" to-layer="2641" to-port="1" /> + <edge from-layer="2641" from-port="2" to-layer="2644" to-port="2" /> + <edge from-layer="2642" from-port="0" to-layer="2644" to-port="3" /> + <edge from-layer="2643" from-port="0" to-layer="2644" to-port="4" /> + <edge from-layer="2644" from-port="5" to-layer="2645" to-port="3" /> + <edge from-layer="2645" from-port="4" to-layer="2647" to-port="0" /> + <edge from-layer="2646" from-port="0" to-layer="2647" to-port="1" /> + <edge from-layer="2647" from-port="2" to-layer="2649" to-port="0" /> + <edge from-layer="2648" from-port="0" to-layer="2649" to-port="1" /> + <edge from-layer="2649" from-port="2" to-layer="2660" to-port="0" /> + <edge from-layer="2650" from-port="0" to-layer="2651" to-port="0" /> + <edge from-layer="2651" from-port="1" to-layer="2654" to-port="0" /> + <edge from-layer="2652" from-port="0" to-layer="2653" to-port="0" /> + <edge from-layer="2653" from-port="1" to-layer="2654" to-port="1" /> + <edge from-layer="2654" from-port="2" to-layer="2656" to-port="0" /> + <edge from-layer="2655" from-port="0" to-layer="2656" to-port="1" /> + <edge from-layer="2656" from-port="2" to-layer="2658" to-port="0" /> + <edge from-layer="2657" from-port="0" to-layer="2658" to-port="1" /> + <edge from-layer="2658" from-port="2" to-layer="2659" to-port="0" /> + <edge from-layer="2659" from-port="1" to-layer="2660" to-port="1" /> + <edge from-layer="2660" from-port="2" to-layer="2661" to-port="1" /> + <edge from-layer="2661" from-port="2" to-layer="2672" to-port="0" /> + <edge from-layer="2661" from-port="2" to-layer="2709" to-port="0" /> + <edge from-layer="2661" from-port="2" to-layer="2665" to-port="0" /> + <edge from-layer="2662" from-port="0" to-layer="2673" to-port="0" /> + <edge from-layer="2663" from-port="0" to-layer="2671" to-port="0" /> + <edge from-layer="2664" from-port="0" to-layer="2665" to-port="1" /> + <edge from-layer="2665" from-port="2" to-layer="2667" to-port="0" /> + <edge from-layer="2666" from-port="0" to-layer="2667" to-port="1" /> + <edge from-layer="2667" from-port="2" to-layer="2669" to-port="0" /> + <edge from-layer="2668" from-port="0" to-layer="2669" to-port="1" /> + <edge from-layer="2669" from-port="2" to-layer="2670" to-port="0" /> + <edge from-layer="2670" from-port="1" to-layer="2671" to-port="1" /> + <edge from-layer="2671" from-port="2" to-layer="2672" to-port="1" /> + <edge from-layer="2672" from-port="2" to-layer="2673" to-port="1" /> + <edge from-layer="2673" from-port="2" to-layer="2696" to-port="0" /> + <edge from-layer="2673" from-port="2" to-layer="2684" to-port="0" /> + <edge from-layer="2674" from-port="0" to-layer="2675" to-port="0" /> + <edge from-layer="2675" from-port="1" to-layer="2678" to-port="0" /> + <edge from-layer="2676" from-port="0" to-layer="2677" to-port="0" /> + <edge from-layer="2677" from-port="1" to-layer="2678" to-port="1" /> + <edge from-layer="2678" from-port="2" to-layer="2680" to-port="0" /> + <edge from-layer="2679" from-port="0" to-layer="2680" to-port="1" /> + <edge from-layer="2680" from-port="2" to-layer="2682" to-port="0" /> + <edge from-layer="2681" from-port="0" to-layer="2682" to-port="1" /> + <edge from-layer="2682" from-port="2" to-layer="2683" to-port="0" /> + <edge from-layer="2683" from-port="1" to-layer="2684" to-port="1" /> + <edge from-layer="2684" from-port="2" to-layer="2685" to-port="0" /> + <edge from-layer="2685" from-port="1" to-layer="2697" to-port="0" /> + <edge from-layer="2686" from-port="0" to-layer="2687" to-port="0" /> + <edge from-layer="2687" from-port="1" to-layer="2690" to-port="0" /> + <edge from-layer="2688" from-port="0" to-layer="2689" to-port="0" /> + <edge from-layer="2689" from-port="1" to-layer="2690" to-port="1" /> + <edge from-layer="2690" from-port="2" to-layer="2692" to-port="0" /> + <edge from-layer="2691" from-port="0" to-layer="2692" to-port="1" /> + <edge from-layer="2692" from-port="2" to-layer="2694" to-port="0" /> + <edge from-layer="2693" from-port="0" to-layer="2694" to-port="1" /> + <edge from-layer="2694" from-port="2" to-layer="2695" to-port="0" /> + <edge from-layer="2695" from-port="1" to-layer="2696" to-port="1" /> + <edge from-layer="2696" from-port="2" to-layer="2697" to-port="1" /> + <edge from-layer="2697" from-port="2" to-layer="2708" to-port="0" /> + <edge from-layer="2698" from-port="0" to-layer="2699" to-port="0" /> + <edge from-layer="2699" from-port="1" to-layer="2702" to-port="0" /> + <edge from-layer="2700" from-port="0" to-layer="2701" to-port="0" /> + <edge from-layer="2701" from-port="1" to-layer="2702" to-port="1" /> + <edge from-layer="2702" from-port="2" to-layer="2704" to-port="0" /> + <edge from-layer="2703" from-port="0" to-layer="2704" to-port="1" /> + <edge from-layer="2704" from-port="2" to-layer="2706" to-port="0" /> + <edge from-layer="2705" from-port="0" to-layer="2706" to-port="1" /> + <edge from-layer="2706" from-port="2" to-layer="2707" to-port="0" /> + <edge from-layer="2707" from-port="1" to-layer="2708" to-port="1" /> + <edge from-layer="2708" from-port="2" to-layer="2709" to-port="1" /> + <edge from-layer="2709" from-port="2" to-layer="2713" to-port="0" /> + <edge from-layer="2709" from-port="2" to-layer="2893" to-port="0" /> + <edge from-layer="2709" from-port="2" to-layer="2720" to-port="0" /> + <edge from-layer="2710" from-port="0" to-layer="2721" to-port="0" /> + <edge from-layer="2711" from-port="0" to-layer="2719" to-port="0" /> + <edge from-layer="2712" from-port="0" to-layer="2713" to-port="1" /> + <edge from-layer="2713" from-port="2" to-layer="2715" to-port="0" /> + <edge from-layer="2714" from-port="0" to-layer="2715" to-port="1" /> + <edge from-layer="2715" from-port="2" to-layer="2717" to-port="0" /> + <edge from-layer="2716" from-port="0" to-layer="2717" to-port="1" /> + <edge from-layer="2717" from-port="2" to-layer="2718" to-port="0" /> + <edge from-layer="2718" from-port="1" to-layer="2719" to-port="1" /> + <edge from-layer="2719" from-port="2" to-layer="2720" to-port="1" /> + <edge from-layer="2720" from-port="2" to-layer="2721" to-port="1" /> + <edge from-layer="2721" from-port="2" to-layer="2780" to-port="0" /> + <edge from-layer="2721" from-port="2" to-layer="2842" to-port="0" /> + <edge from-layer="2721" from-port="2" to-layer="2732" to-port="0" /> + <edge from-layer="2722" from-port="0" to-layer="2723" to-port="0" /> + <edge from-layer="2723" from-port="1" to-layer="2726" to-port="0" /> + <edge from-layer="2724" from-port="0" to-layer="2725" to-port="0" /> + <edge from-layer="2725" from-port="1" to-layer="2726" to-port="1" /> + <edge from-layer="2726" from-port="2" to-layer="2728" to-port="0" /> + <edge from-layer="2727" from-port="0" to-layer="2728" to-port="1" /> + <edge from-layer="2728" from-port="2" to-layer="2730" to-port="0" /> + <edge from-layer="2729" from-port="0" to-layer="2730" to-port="1" /> + <edge from-layer="2730" from-port="2" to-layer="2731" to-port="0" /> + <edge from-layer="2731" from-port="1" to-layer="2732" to-port="1" /> + <edge from-layer="2732" from-port="2" to-layer="2735" to-port="0" /> + <edge from-layer="2733" from-port="0" to-layer="2734" to-port="0" /> + <edge from-layer="2734" from-port="1" to-layer="2735" to-port="1" /> + <edge from-layer="2735" from-port="2" to-layer="2737" to-port="0" /> + <edge from-layer="2736" from-port="0" to-layer="2737" to-port="1" /> + <edge from-layer="2737" from-port="2" to-layer="2739" to-port="0" /> + <edge from-layer="2738" from-port="0" to-layer="2739" to-port="1" /> + <edge from-layer="2739" from-port="2" to-layer="2757" to-port="0" /> + <edge from-layer="2739" from-port="2" to-layer="2751" to-port="0" /> + <edge from-layer="2739" from-port="2" to-layer="2740" to-port="0" /> + <edge from-layer="2739" from-port="2" to-layer="2741" to-port="0" /> + <edge from-layer="2740" from-port="2" to-layer="2760" to-port="0" /> + <edge from-layer="2741" from-port="1" to-layer="2743" to-port="0" /> + <edge from-layer="2742" from-port="0" to-layer="2743" to-port="2" /> + <edge from-layer="2743" from-port="3" to-layer="2744" to-port="0" /> + <edge from-layer="2744" from-port="2" to-layer="2745" to-port="0" /> + <edge from-layer="2745" from-port="1" to-layer="2747" to-port="0" /> + <edge from-layer="2746" from-port="0" to-layer="2747" to-port="1" /> + <edge from-layer="2747" from-port="2" to-layer="2751" to-port="1" /> + <edge from-layer="2747" from-port="2" to-layer="2757" to-port="2" /> + <edge from-layer="2748" from-port="0" to-layer="2751" to-port="2" /> + <edge from-layer="2749" from-port="0" to-layer="2751" to-port="3" /> + <edge from-layer="2750" from-port="0" to-layer="2751" to-port="4" /> + <edge from-layer="2751" from-port="5" to-layer="2753" to-port="0" /> + <edge from-layer="2752" from-port="0" to-layer="2753" to-port="1" /> + <edge from-layer="2753" from-port="2" to-layer="2758" to-port="0" /> + <edge from-layer="2754" from-port="0" to-layer="2757" to-port="1" /> + <edge from-layer="2755" from-port="0" to-layer="2757" to-port="3" /> + <edge from-layer="2756" from-port="0" to-layer="2757" to-port="4" /> + <edge from-layer="2757" from-port="5" to-layer="2758" to-port="1" /> + <edge from-layer="2758" from-port="2" to-layer="2759" to-port="0" /> + <edge from-layer="2759" from-port="2" to-layer="2760" to-port="1" /> + <edge from-layer="2760" from-port="2" to-layer="2877" to-port="0" /> + <edge from-layer="2761" from-port="0" to-layer="2766" to-port="0" /> + <edge from-layer="2762" from-port="0" to-layer="2765" to-port="1" /> + <edge from-layer="2763" from-port="0" to-layer="2765" to-port="2" /> + <edge from-layer="2764" from-port="0" to-layer="2765" to-port="3" /> + <edge from-layer="2765" from-port="4" to-layer="2766" to-port="1" /> + <edge from-layer="2766" from-port="2" to-layer="2767" to-port="0" /> + <edge from-layer="2767" from-port="1" to-layer="2769" to-port="0" /> + <edge from-layer="2768" from-port="0" to-layer="2769" to-port="2" /> + <edge from-layer="2769" from-port="3" to-layer="2809" to-port="0" /> + <edge from-layer="2769" from-port="3" to-layer="2865" to-port="0" /> + <edge from-layer="2770" from-port="0" to-layer="2771" to-port="0" /> + <edge from-layer="2771" from-port="1" to-layer="2774" to-port="0" /> + <edge from-layer="2772" from-port="0" to-layer="2773" to-port="0" /> + <edge from-layer="2773" from-port="1" to-layer="2774" to-port="1" /> + <edge from-layer="2774" from-port="2" to-layer="2776" to-port="0" /> + <edge from-layer="2775" from-port="0" to-layer="2776" to-port="1" /> + <edge from-layer="2776" from-port="2" to-layer="2778" to-port="0" /> + <edge from-layer="2777" from-port="0" to-layer="2778" to-port="1" /> + <edge from-layer="2778" from-port="2" to-layer="2779" to-port="0" /> + <edge from-layer="2779" from-port="1" to-layer="2780" to-port="1" /> + <edge from-layer="2780" from-port="2" to-layer="2783" to-port="0" /> + <edge from-layer="2781" from-port="0" to-layer="2782" to-port="0" /> + <edge from-layer="2782" from-port="1" to-layer="2783" to-port="1" /> + <edge from-layer="2783" from-port="2" to-layer="2785" to-port="0" /> + <edge from-layer="2784" from-port="0" to-layer="2785" to-port="1" /> + <edge from-layer="2785" from-port="2" to-layer="2787" to-port="0" /> + <edge from-layer="2786" from-port="0" to-layer="2787" to-port="1" /> + <edge from-layer="2787" from-port="2" to-layer="2799" to-port="0" /> + <edge from-layer="2787" from-port="2" to-layer="2805" to-port="0" /> + <edge from-layer="2787" from-port="2" to-layer="2789" to-port="0" /> + <edge from-layer="2787" from-port="2" to-layer="2788" to-port="0" /> + <edge from-layer="2788" from-port="2" to-layer="2808" to-port="0" /> + <edge from-layer="2789" from-port="1" to-layer="2791" to-port="0" /> + <edge from-layer="2790" from-port="0" to-layer="2791" to-port="2" /> + <edge from-layer="2791" from-port="3" to-layer="2792" to-port="0" /> + <edge from-layer="2792" from-port="2" to-layer="2793" to-port="0" /> + <edge from-layer="2793" from-port="1" to-layer="2795" to-port="0" /> + <edge from-layer="2794" from-port="0" to-layer="2795" to-port="1" /> + <edge from-layer="2795" from-port="2" to-layer="2799" to-port="1" /> + <edge from-layer="2795" from-port="2" to-layer="2805" to-port="2" /> + <edge from-layer="2796" from-port="0" to-layer="2799" to-port="2" /> + <edge from-layer="2797" from-port="0" to-layer="2799" to-port="3" /> + <edge from-layer="2798" from-port="0" to-layer="2799" to-port="4" /> + <edge from-layer="2799" from-port="5" to-layer="2801" to-port="0" /> + <edge from-layer="2800" from-port="0" to-layer="2801" to-port="1" /> + <edge from-layer="2801" from-port="2" to-layer="2806" to-port="0" /> + <edge from-layer="2802" from-port="0" to-layer="2805" to-port="1" /> + <edge from-layer="2803" from-port="0" to-layer="2805" to-port="3" /> + <edge from-layer="2804" from-port="0" to-layer="2805" to-port="4" /> + <edge from-layer="2805" from-port="5" to-layer="2806" to-port="1" /> + <edge from-layer="2806" from-port="2" to-layer="2807" to-port="0" /> + <edge from-layer="2807" from-port="2" to-layer="2808" to-port="1" /> + <edge from-layer="2808" from-port="2" to-layer="2809" to-port="1" /> + <edge from-layer="2808" from-port="2" to-layer="2869" to-port="0" /> + <edge from-layer="2809" from-port="2" to-layer="2810" to-port="0" /> + <edge from-layer="2809" from-port="2" to-layer="11220" to-port="0" /> + <edge from-layer="2809" from-port="2" to-layer="2811" to-port="0" /> + <edge from-layer="2810" from-port="2" to-layer="2820" to-port="0" /> + <edge from-layer="2811" from-port="1" to-layer="2818" to-port="0" /> + <edge from-layer="2811" from-port="1" to-layer="2814" to-port="0" /> + <edge from-layer="2812" from-port="0" to-layer="2814" to-port="1" /> + <edge from-layer="2813" from-port="0" to-layer="2814" to-port="2" /> + <edge from-layer="2814" from-port="3" to-layer="2819" to-port="0" /> + <edge from-layer="2815" from-port="0" to-layer="2819" to-port="1" /> + <edge from-layer="2816" from-port="0" to-layer="2818" to-port="1" /> + <edge from-layer="2817" from-port="0" to-layer="2818" to-port="2" /> + <edge from-layer="2818" from-port="3" to-layer="2819" to-port="2" /> + <edge from-layer="2819" from-port="3" to-layer="2820" to-port="1" /> + <edge from-layer="2820" from-port="2" to-layer="2822" to-port="0" /> + <edge from-layer="2821" from-port="0" to-layer="2822" to-port="1" /> + <edge from-layer="2822" from-port="2" to-layer="2877" to-port="1" /> + <edge from-layer="2823" from-port="0" to-layer="2828" to-port="0" /> + <edge from-layer="2824" from-port="0" to-layer="2827" to-port="1" /> + <edge from-layer="2825" from-port="0" to-layer="2827" to-port="2" /> + <edge from-layer="2826" from-port="0" to-layer="2827" to-port="3" /> + <edge from-layer="2827" from-port="4" to-layer="2828" to-port="1" /> + <edge from-layer="2828" from-port="2" to-layer="2829" to-port="0" /> + <edge from-layer="2829" from-port="1" to-layer="2831" to-port="0" /> + <edge from-layer="2830" from-port="0" to-layer="2831" to-port="2" /> + <edge from-layer="2831" from-port="3" to-layer="2850" to-port="0" /> + <edge from-layer="2832" from-port="0" to-layer="2833" to-port="0" /> + <edge from-layer="2833" from-port="1" to-layer="2836" to-port="0" /> + <edge from-layer="2834" from-port="0" to-layer="2835" to-port="0" /> + <edge from-layer="2835" from-port="1" to-layer="2836" to-port="1" /> + <edge from-layer="2836" from-port="2" to-layer="2838" to-port="0" /> + <edge from-layer="2837" from-port="0" to-layer="2838" to-port="1" /> + <edge from-layer="2838" from-port="2" to-layer="2840" to-port="0" /> + <edge from-layer="2839" from-port="0" to-layer="2840" to-port="1" /> + <edge from-layer="2840" from-port="2" to-layer="2841" to-port="0" /> + <edge from-layer="2841" from-port="1" to-layer="2842" to-port="1" /> + <edge from-layer="2842" from-port="2" to-layer="2845" to-port="0" /> + <edge from-layer="2843" from-port="0" to-layer="2844" to-port="0" /> + <edge from-layer="2844" from-port="1" to-layer="2845" to-port="1" /> + <edge from-layer="2845" from-port="2" to-layer="2847" to-port="0" /> + <edge from-layer="2846" from-port="0" to-layer="2847" to-port="1" /> + <edge from-layer="2847" from-port="2" to-layer="2849" to-port="0" /> + <edge from-layer="2848" from-port="0" to-layer="2849" to-port="1" /> + <edge from-layer="2849" from-port="2" to-layer="2850" to-port="1" /> + <edge from-layer="2850" from-port="2" to-layer="2851" to-port="0" /> + <edge from-layer="2850" from-port="2" to-layer="11219" to-port="0" /> + <edge from-layer="2850" from-port="2" to-layer="2852" to-port="0" /> + <edge from-layer="2851" from-port="2" to-layer="2861" to-port="0" /> + <edge from-layer="2852" from-port="1" to-layer="2855" to-port="0" /> + <edge from-layer="2852" from-port="1" to-layer="2859" to-port="0" /> + <edge from-layer="2853" from-port="0" to-layer="2855" to-port="1" /> + <edge from-layer="2854" from-port="0" to-layer="2855" to-port="2" /> + <edge from-layer="2855" from-port="3" to-layer="2860" to-port="1" /> + <edge from-layer="2856" from-port="0" to-layer="2860" to-port="2" /> + <edge from-layer="2857" from-port="0" to-layer="2859" to-port="1" /> + <edge from-layer="2858" from-port="0" to-layer="2859" to-port="2" /> + <edge from-layer="2859" from-port="3" to-layer="2860" to-port="3" /> + <edge from-layer="2860" from-port="4" to-layer="2861" to-port="1" /> + <edge from-layer="2861" from-port="2" to-layer="2863" to-port="0" /> + <edge from-layer="2862" from-port="0" to-layer="2863" to-port="1" /> + <edge from-layer="2863" from-port="2" to-layer="2877" to-port="2" /> + <edge from-layer="2864" from-port="0" to-layer="2876" to-port="1" /> + <edge from-layer="2865" from-port="1" to-layer="2868" to-port="0" /> + <edge from-layer="2866" from-port="0" to-layer="2868" to-port="1" /> + <edge from-layer="2867" from-port="0" to-layer="2868" to-port="2" /> + <edge from-layer="2868" from-port="3" to-layer="2873" to-port="0" /> + <edge from-layer="2869" from-port="1" to-layer="2872" to-port="0" /> + <edge from-layer="2870" from-port="0" to-layer="2872" to-port="1" /> + <edge from-layer="2871" from-port="0" to-layer="2872" to-port="2" /> + <edge from-layer="2872" from-port="3" to-layer="2873" to-port="1" /> + <edge from-layer="2873" from-port="2" to-layer="2876" to-port="2" /> + <edge from-layer="2874" from-port="0" to-layer="2876" to-port="3" /> + <edge from-layer="2875" from-port="0" to-layer="2876" to-port="4" /> + <edge from-layer="2876" from-port="5" to-layer="2877" to-port="3" /> + <edge from-layer="2877" from-port="4" to-layer="2879" to-port="0" /> + <edge from-layer="2878" from-port="0" to-layer="2879" to-port="1" /> + <edge from-layer="2879" from-port="2" to-layer="2881" to-port="0" /> + <edge from-layer="2880" from-port="0" to-layer="2881" to-port="1" /> + <edge from-layer="2881" from-port="2" to-layer="2892" to-port="0" /> + <edge from-layer="2882" from-port="0" to-layer="2883" to-port="0" /> + <edge from-layer="2883" from-port="1" to-layer="2886" to-port="0" /> + <edge from-layer="2884" from-port="0" to-layer="2885" to-port="0" /> + <edge from-layer="2885" from-port="1" to-layer="2886" to-port="1" /> + <edge from-layer="2886" from-port="2" to-layer="2888" to-port="0" /> + <edge from-layer="2887" from-port="0" to-layer="2888" to-port="1" /> + <edge from-layer="2888" from-port="2" to-layer="2890" to-port="0" /> + <edge from-layer="2889" from-port="0" to-layer="2890" to-port="1" /> + <edge from-layer="2890" from-port="2" to-layer="2891" to-port="0" /> + <edge from-layer="2891" from-port="1" to-layer="2892" to-port="1" /> + <edge from-layer="2892" from-port="2" to-layer="2893" to-port="1" /> + <edge from-layer="2893" from-port="2" to-layer="2941" to-port="0" /> + <edge from-layer="2893" from-port="2" to-layer="2897" to-port="0" /> + <edge from-layer="2893" from-port="2" to-layer="2904" to-port="0" /> + <edge from-layer="2894" from-port="0" to-layer="2905" to-port="0" /> + <edge from-layer="2895" from-port="0" to-layer="2903" to-port="0" /> + <edge from-layer="2896" from-port="0" to-layer="2897" to-port="1" /> + <edge from-layer="2897" from-port="2" to-layer="2899" to-port="0" /> + <edge from-layer="2898" from-port="0" to-layer="2899" to-port="1" /> + <edge from-layer="2899" from-port="2" to-layer="2901" to-port="0" /> + <edge from-layer="2900" from-port="0" to-layer="2901" to-port="1" /> + <edge from-layer="2901" from-port="2" to-layer="2902" to-port="0" /> + <edge from-layer="2902" from-port="1" to-layer="2903" to-port="1" /> + <edge from-layer="2903" from-port="2" to-layer="2904" to-port="1" /> + <edge from-layer="2904" from-port="2" to-layer="2905" to-port="1" /> + <edge from-layer="2905" from-port="2" to-layer="2928" to-port="0" /> + <edge from-layer="2905" from-port="2" to-layer="2916" to-port="0" /> + <edge from-layer="2906" from-port="0" to-layer="2907" to-port="0" /> + <edge from-layer="2907" from-port="1" to-layer="2910" to-port="0" /> + <edge from-layer="2908" from-port="0" to-layer="2909" to-port="0" /> + <edge from-layer="2909" from-port="1" to-layer="2910" to-port="1" /> + <edge from-layer="2910" from-port="2" to-layer="2912" to-port="0" /> + <edge from-layer="2911" from-port="0" to-layer="2912" to-port="1" /> + <edge from-layer="2912" from-port="2" to-layer="2914" to-port="0" /> + <edge from-layer="2913" from-port="0" to-layer="2914" to-port="1" /> + <edge from-layer="2914" from-port="2" to-layer="2915" to-port="0" /> + <edge from-layer="2915" from-port="1" to-layer="2916" to-port="1" /> + <edge from-layer="2916" from-port="2" to-layer="2917" to-port="0" /> + <edge from-layer="2917" from-port="1" to-layer="2929" to-port="0" /> + <edge from-layer="2918" from-port="0" to-layer="2919" to-port="0" /> + <edge from-layer="2919" from-port="1" to-layer="2922" to-port="0" /> + <edge from-layer="2920" from-port="0" to-layer="2921" to-port="0" /> + <edge from-layer="2921" from-port="1" to-layer="2922" to-port="1" /> + <edge from-layer="2922" from-port="2" to-layer="2924" to-port="0" /> + <edge from-layer="2923" from-port="0" to-layer="2924" to-port="1" /> + <edge from-layer="2924" from-port="2" to-layer="2926" to-port="0" /> + <edge from-layer="2925" from-port="0" to-layer="2926" to-port="1" /> + <edge from-layer="2926" from-port="2" to-layer="2927" to-port="0" /> + <edge from-layer="2927" from-port="1" to-layer="2928" to-port="1" /> + <edge from-layer="2928" from-port="2" to-layer="2929" to-port="1" /> + <edge from-layer="2929" from-port="2" to-layer="2940" to-port="0" /> + <edge from-layer="2930" from-port="0" to-layer="2931" to-port="0" /> + <edge from-layer="2931" from-port="1" to-layer="2934" to-port="0" /> + <edge from-layer="2932" from-port="0" to-layer="2933" to-port="0" /> + <edge from-layer="2933" from-port="1" to-layer="2934" to-port="1" /> + <edge from-layer="2934" from-port="2" to-layer="2936" to-port="0" /> + <edge from-layer="2935" from-port="0" to-layer="2936" to-port="1" /> + <edge from-layer="2936" from-port="2" to-layer="2938" to-port="0" /> + <edge from-layer="2937" from-port="0" to-layer="2938" to-port="1" /> + <edge from-layer="2938" from-port="2" to-layer="2939" to-port="0" /> + <edge from-layer="2939" from-port="1" to-layer="2940" to-port="1" /> + <edge from-layer="2940" from-port="2" to-layer="2941" to-port="1" /> + <edge from-layer="2941" from-port="2" to-layer="2945" to-port="0" /> + <edge from-layer="2941" from-port="2" to-layer="3125" to-port="0" /> + <edge from-layer="2941" from-port="2" to-layer="2952" to-port="0" /> + <edge from-layer="2942" from-port="0" to-layer="2953" to-port="0" /> + <edge from-layer="2943" from-port="0" to-layer="2951" to-port="0" /> + <edge from-layer="2944" from-port="0" to-layer="2945" to-port="1" /> + <edge from-layer="2945" from-port="2" to-layer="2947" to-port="0" /> + <edge from-layer="2946" from-port="0" to-layer="2947" to-port="1" /> + <edge from-layer="2947" from-port="2" to-layer="2949" to-port="0" /> + <edge from-layer="2948" from-port="0" to-layer="2949" to-port="1" /> + <edge from-layer="2949" from-port="2" to-layer="2950" to-port="0" /> + <edge from-layer="2950" from-port="1" to-layer="2951" to-port="1" /> + <edge from-layer="2951" from-port="2" to-layer="2952" to-port="1" /> + <edge from-layer="2952" from-port="2" to-layer="2953" to-port="1" /> + <edge from-layer="2953" from-port="2" to-layer="3012" to-port="0" /> + <edge from-layer="2953" from-port="2" to-layer="3074" to-port="0" /> + <edge from-layer="2953" from-port="2" to-layer="2964" to-port="0" /> + <edge from-layer="2954" from-port="0" to-layer="2955" to-port="0" /> + <edge from-layer="2955" from-port="1" to-layer="2958" to-port="0" /> + <edge from-layer="2956" from-port="0" to-layer="2957" to-port="0" /> + <edge from-layer="2957" from-port="1" to-layer="2958" to-port="1" /> + <edge from-layer="2958" from-port="2" to-layer="2960" to-port="0" /> + <edge from-layer="2959" from-port="0" to-layer="2960" to-port="1" /> + <edge from-layer="2960" from-port="2" to-layer="2962" to-port="0" /> + <edge from-layer="2961" from-port="0" to-layer="2962" to-port="1" /> + <edge from-layer="2962" from-port="2" to-layer="2963" to-port="0" /> + <edge from-layer="2963" from-port="1" to-layer="2964" to-port="1" /> + <edge from-layer="2964" from-port="2" to-layer="2967" to-port="0" /> + <edge from-layer="2965" from-port="0" to-layer="2966" to-port="0" /> + <edge from-layer="2966" from-port="1" to-layer="2967" to-port="1" /> + <edge from-layer="2967" from-port="2" to-layer="2969" to-port="0" /> + <edge from-layer="2968" from-port="0" to-layer="2969" to-port="1" /> + <edge from-layer="2969" from-port="2" to-layer="2971" to-port="0" /> + <edge from-layer="2970" from-port="0" to-layer="2971" to-port="1" /> + <edge from-layer="2971" from-port="2" to-layer="2972" to-port="0" /> + <edge from-layer="2971" from-port="2" to-layer="2973" to-port="0" /> + <edge from-layer="2971" from-port="2" to-layer="2989" to-port="0" /> + <edge from-layer="2971" from-port="2" to-layer="2983" to-port="0" /> + <edge from-layer="2972" from-port="2" to-layer="2992" to-port="0" /> + <edge from-layer="2973" from-port="1" to-layer="2975" to-port="0" /> + <edge from-layer="2974" from-port="0" to-layer="2975" to-port="2" /> + <edge from-layer="2975" from-port="3" to-layer="2976" to-port="0" /> + <edge from-layer="2976" from-port="2" to-layer="2977" to-port="0" /> + <edge from-layer="2977" from-port="1" to-layer="2979" to-port="0" /> + <edge from-layer="2978" from-port="0" to-layer="2979" to-port="1" /> + <edge from-layer="2979" from-port="2" to-layer="2983" to-port="1" /> + <edge from-layer="2979" from-port="2" to-layer="2989" to-port="2" /> + <edge from-layer="2980" from-port="0" to-layer="2983" to-port="2" /> + <edge from-layer="2981" from-port="0" to-layer="2983" to-port="3" /> + <edge from-layer="2982" from-port="0" to-layer="2983" to-port="4" /> + <edge from-layer="2983" from-port="5" to-layer="2985" to-port="0" /> + <edge from-layer="2984" from-port="0" to-layer="2985" to-port="1" /> + <edge from-layer="2985" from-port="2" to-layer="2990" to-port="0" /> + <edge from-layer="2986" from-port="0" to-layer="2989" to-port="1" /> + <edge from-layer="2987" from-port="0" to-layer="2989" to-port="3" /> + <edge from-layer="2988" from-port="0" to-layer="2989" to-port="4" /> + <edge from-layer="2989" from-port="5" to-layer="2990" to-port="1" /> + <edge from-layer="2990" from-port="2" to-layer="2991" to-port="0" /> + <edge from-layer="2991" from-port="2" to-layer="2992" to-port="1" /> + <edge from-layer="2992" from-port="2" to-layer="3109" to-port="0" /> + <edge from-layer="2993" from-port="0" to-layer="2998" to-port="0" /> + <edge from-layer="2994" from-port="0" to-layer="2997" to-port="1" /> + <edge from-layer="2995" from-port="0" to-layer="2997" to-port="2" /> + <edge from-layer="2996" from-port="0" to-layer="2997" to-port="3" /> + <edge from-layer="2997" from-port="4" to-layer="2998" to-port="1" /> + <edge from-layer="2998" from-port="2" to-layer="2999" to-port="0" /> + <edge from-layer="2999" from-port="1" to-layer="3001" to-port="0" /> + <edge from-layer="3000" from-port="0" to-layer="3001" to-port="2" /> + <edge from-layer="3001" from-port="3" to-layer="3097" to-port="0" /> + <edge from-layer="3001" from-port="3" to-layer="3041" to-port="0" /> + <edge from-layer="3002" from-port="0" to-layer="3003" to-port="0" /> + <edge from-layer="3003" from-port="1" to-layer="3006" to-port="0" /> + <edge from-layer="3004" from-port="0" to-layer="3005" to-port="0" /> + <edge from-layer="3005" from-port="1" to-layer="3006" to-port="1" /> + <edge from-layer="3006" from-port="2" to-layer="3008" to-port="0" /> + <edge from-layer="3007" from-port="0" to-layer="3008" to-port="1" /> + <edge from-layer="3008" from-port="2" to-layer="3010" to-port="0" /> + <edge from-layer="3009" from-port="0" to-layer="3010" to-port="1" /> + <edge from-layer="3010" from-port="2" to-layer="3011" to-port="0" /> + <edge from-layer="3011" from-port="1" to-layer="3012" to-port="1" /> + <edge from-layer="3012" from-port="2" to-layer="3015" to-port="0" /> + <edge from-layer="3013" from-port="0" to-layer="3014" to-port="0" /> + <edge from-layer="3014" from-port="1" to-layer="3015" to-port="1" /> + <edge from-layer="3015" from-port="2" to-layer="3017" to-port="0" /> + <edge from-layer="3016" from-port="0" to-layer="3017" to-port="1" /> + <edge from-layer="3017" from-port="2" to-layer="3019" to-port="0" /> + <edge from-layer="3018" from-port="0" to-layer="3019" to-port="1" /> + <edge from-layer="3019" from-port="2" to-layer="3031" to-port="0" /> + <edge from-layer="3019" from-port="2" to-layer="3021" to-port="0" /> + <edge from-layer="3019" from-port="2" to-layer="3020" to-port="0" /> + <edge from-layer="3019" from-port="2" to-layer="3037" to-port="0" /> + <edge from-layer="3020" from-port="2" to-layer="3040" to-port="0" /> + <edge from-layer="3021" from-port="1" to-layer="3023" to-port="0" /> + <edge from-layer="3022" from-port="0" to-layer="3023" to-port="2" /> + <edge from-layer="3023" from-port="3" to-layer="3024" to-port="0" /> + <edge from-layer="3024" from-port="2" to-layer="3025" to-port="0" /> + <edge from-layer="3025" from-port="1" to-layer="3027" to-port="0" /> + <edge from-layer="3026" from-port="0" to-layer="3027" to-port="1" /> + <edge from-layer="3027" from-port="2" to-layer="3037" to-port="2" /> + <edge from-layer="3027" from-port="2" to-layer="3031" to-port="1" /> + <edge from-layer="3028" from-port="0" to-layer="3031" to-port="2" /> + <edge from-layer="3029" from-port="0" to-layer="3031" to-port="3" /> + <edge from-layer="3030" from-port="0" to-layer="3031" to-port="4" /> + <edge from-layer="3031" from-port="5" to-layer="3033" to-port="0" /> + <edge from-layer="3032" from-port="0" to-layer="3033" to-port="1" /> + <edge from-layer="3033" from-port="2" to-layer="3038" to-port="0" /> + <edge from-layer="3034" from-port="0" to-layer="3037" to-port="1" /> + <edge from-layer="3035" from-port="0" to-layer="3037" to-port="3" /> + <edge from-layer="3036" from-port="0" to-layer="3037" to-port="4" /> + <edge from-layer="3037" from-port="5" to-layer="3038" to-port="1" /> + <edge from-layer="3038" from-port="2" to-layer="3039" to-port="0" /> + <edge from-layer="3039" from-port="2" to-layer="3040" to-port="1" /> + <edge from-layer="3040" from-port="2" to-layer="3101" to-port="0" /> + <edge from-layer="3040" from-port="2" to-layer="3041" to-port="1" /> + <edge from-layer="3041" from-port="2" to-layer="3043" to-port="0" /> + <edge from-layer="3041" from-port="2" to-layer="3042" to-port="0" /> + <edge from-layer="3041" from-port="2" to-layer="11218" to-port="0" /> + <edge from-layer="3042" from-port="2" to-layer="3052" to-port="0" /> + <edge from-layer="3043" from-port="1" to-layer="3046" to-port="0" /> + <edge from-layer="3043" from-port="1" to-layer="3050" to-port="0" /> + <edge from-layer="3044" from-port="0" to-layer="3046" to-port="1" /> + <edge from-layer="3045" from-port="0" to-layer="3046" to-port="2" /> + <edge from-layer="3046" from-port="3" to-layer="3051" to-port="0" /> + <edge from-layer="3047" from-port="0" to-layer="3051" to-port="1" /> + <edge from-layer="3048" from-port="0" to-layer="3050" to-port="1" /> + <edge from-layer="3049" from-port="0" to-layer="3050" to-port="2" /> + <edge from-layer="3050" from-port="3" to-layer="3051" to-port="2" /> + <edge from-layer="3051" from-port="3" to-layer="3052" to-port="1" /> + <edge from-layer="3052" from-port="2" to-layer="3054" to-port="0" /> + <edge from-layer="3053" from-port="0" to-layer="3054" to-port="1" /> + <edge from-layer="3054" from-port="2" to-layer="3109" to-port="1" /> + <edge from-layer="3055" from-port="0" to-layer="3060" to-port="0" /> + <edge from-layer="3056" from-port="0" to-layer="3059" to-port="1" /> + <edge from-layer="3057" from-port="0" to-layer="3059" to-port="2" /> + <edge from-layer="3058" from-port="0" to-layer="3059" to-port="3" /> + <edge from-layer="3059" from-port="4" to-layer="3060" to-port="1" /> + <edge from-layer="3060" from-port="2" to-layer="3061" to-port="0" /> + <edge from-layer="3061" from-port="1" to-layer="3063" to-port="0" /> + <edge from-layer="3062" from-port="0" to-layer="3063" to-port="2" /> + <edge from-layer="3063" from-port="3" to-layer="3082" to-port="0" /> + <edge from-layer="3064" from-port="0" to-layer="3065" to-port="0" /> + <edge from-layer="3065" from-port="1" to-layer="3068" to-port="0" /> + <edge from-layer="3066" from-port="0" to-layer="3067" to-port="0" /> + <edge from-layer="3067" from-port="1" to-layer="3068" to-port="1" /> + <edge from-layer="3068" from-port="2" to-layer="3070" to-port="0" /> + <edge from-layer="3069" from-port="0" to-layer="3070" to-port="1" /> + <edge from-layer="3070" from-port="2" to-layer="3072" to-port="0" /> + <edge from-layer="3071" from-port="0" to-layer="3072" to-port="1" /> + <edge from-layer="3072" from-port="2" to-layer="3073" to-port="0" /> + <edge from-layer="3073" from-port="1" to-layer="3074" to-port="1" /> + <edge from-layer="3074" from-port="2" to-layer="3077" to-port="0" /> + <edge from-layer="3075" from-port="0" to-layer="3076" to-port="0" /> + <edge from-layer="3076" from-port="1" to-layer="3077" to-port="1" /> + <edge from-layer="3077" from-port="2" to-layer="3079" to-port="0" /> + <edge from-layer="3078" from-port="0" to-layer="3079" to-port="1" /> + <edge from-layer="3079" from-port="2" to-layer="3081" to-port="0" /> + <edge from-layer="3080" from-port="0" to-layer="3081" to-port="1" /> + <edge from-layer="3081" from-port="2" to-layer="3082" to-port="1" /> + <edge from-layer="3082" from-port="2" to-layer="3083" to-port="0" /> + <edge from-layer="3082" from-port="2" to-layer="3084" to-port="0" /> + <edge from-layer="3082" from-port="2" to-layer="11217" to-port="0" /> + <edge from-layer="3083" from-port="2" to-layer="3093" to-port="0" /> + <edge from-layer="3084" from-port="1" to-layer="3087" to-port="0" /> + <edge from-layer="3084" from-port="1" to-layer="3091" to-port="0" /> + <edge from-layer="3085" from-port="0" to-layer="3087" to-port="1" /> + <edge from-layer="3086" from-port="0" to-layer="3087" to-port="2" /> + <edge from-layer="3087" from-port="3" to-layer="3092" to-port="1" /> + <edge from-layer="3088" from-port="0" to-layer="3092" to-port="2" /> + <edge from-layer="3089" from-port="0" to-layer="3091" to-port="1" /> + <edge from-layer="3090" from-port="0" to-layer="3091" to-port="2" /> + <edge from-layer="3091" from-port="3" to-layer="3092" to-port="3" /> + <edge from-layer="3092" from-port="4" to-layer="3093" to-port="1" /> + <edge from-layer="3093" from-port="2" to-layer="3095" to-port="0" /> + <edge from-layer="3094" from-port="0" to-layer="3095" to-port="1" /> + <edge from-layer="3095" from-port="2" to-layer="3109" to-port="2" /> + <edge from-layer="3096" from-port="0" to-layer="3108" to-port="1" /> + <edge from-layer="3097" from-port="1" to-layer="3100" to-port="0" /> + <edge from-layer="3098" from-port="0" to-layer="3100" to-port="1" /> + <edge from-layer="3099" from-port="0" to-layer="3100" to-port="2" /> + <edge from-layer="3100" from-port="3" to-layer="3105" to-port="0" /> + <edge from-layer="3101" from-port="1" to-layer="3104" to-port="0" /> + <edge from-layer="3102" from-port="0" to-layer="3104" to-port="1" /> + <edge from-layer="3103" from-port="0" to-layer="3104" to-port="2" /> + <edge from-layer="3104" from-port="3" to-layer="3105" to-port="1" /> + <edge from-layer="3105" from-port="2" to-layer="3108" to-port="2" /> + <edge from-layer="3106" from-port="0" to-layer="3108" to-port="3" /> + <edge from-layer="3107" from-port="0" to-layer="3108" to-port="4" /> + <edge from-layer="3108" from-port="5" to-layer="3109" to-port="3" /> + <edge from-layer="3109" from-port="4" to-layer="3111" to-port="0" /> + <edge from-layer="3110" from-port="0" to-layer="3111" to-port="1" /> + <edge from-layer="3111" from-port="2" to-layer="3113" to-port="0" /> + <edge from-layer="3112" from-port="0" to-layer="3113" to-port="1" /> + <edge from-layer="3113" from-port="2" to-layer="3124" to-port="0" /> + <edge from-layer="3114" from-port="0" to-layer="3115" to-port="0" /> + <edge from-layer="3115" from-port="1" to-layer="3118" to-port="0" /> + <edge from-layer="3116" from-port="0" to-layer="3117" to-port="0" /> + <edge from-layer="3117" from-port="1" to-layer="3118" to-port="1" /> + <edge from-layer="3118" from-port="2" to-layer="3120" to-port="0" /> + <edge from-layer="3119" from-port="0" to-layer="3120" to-port="1" /> + <edge from-layer="3120" from-port="2" to-layer="3122" to-port="0" /> + <edge from-layer="3121" from-port="0" to-layer="3122" to-port="1" /> + <edge from-layer="3122" from-port="2" to-layer="3123" to-port="0" /> + <edge from-layer="3123" from-port="1" to-layer="3124" to-port="1" /> + <edge from-layer="3124" from-port="2" to-layer="3125" to-port="1" /> + <edge from-layer="3125" from-port="2" to-layer="3173" to-port="0" /> + <edge from-layer="3125" from-port="2" to-layer="3129" to-port="0" /> + <edge from-layer="3125" from-port="2" to-layer="3136" to-port="0" /> + <edge from-layer="3126" from-port="0" to-layer="3137" to-port="0" /> + <edge from-layer="3127" from-port="0" to-layer="3135" to-port="0" /> + <edge from-layer="3128" from-port="0" to-layer="3129" to-port="1" /> + <edge from-layer="3129" from-port="2" to-layer="3131" to-port="0" /> + <edge from-layer="3130" from-port="0" to-layer="3131" to-port="1" /> + <edge from-layer="3131" from-port="2" to-layer="3133" to-port="0" /> + <edge from-layer="3132" from-port="0" to-layer="3133" to-port="1" /> + <edge from-layer="3133" from-port="2" to-layer="3134" to-port="0" /> + <edge from-layer="3134" from-port="1" to-layer="3135" to-port="1" /> + <edge from-layer="3135" from-port="2" to-layer="3136" to-port="1" /> + <edge from-layer="3136" from-port="2" to-layer="3137" to-port="1" /> + <edge from-layer="3137" from-port="2" to-layer="3160" to-port="0" /> + <edge from-layer="3137" from-port="2" to-layer="3148" to-port="0" /> + <edge from-layer="3138" from-port="0" to-layer="3139" to-port="0" /> + <edge from-layer="3139" from-port="1" to-layer="3142" to-port="0" /> + <edge from-layer="3140" from-port="0" to-layer="3141" to-port="0" /> + <edge from-layer="3141" from-port="1" to-layer="3142" to-port="1" /> + <edge from-layer="3142" from-port="2" to-layer="3144" to-port="0" /> + <edge from-layer="3143" from-port="0" to-layer="3144" to-port="1" /> + <edge from-layer="3144" from-port="2" to-layer="3146" to-port="0" /> + <edge from-layer="3145" from-port="0" to-layer="3146" to-port="1" /> + <edge from-layer="3146" from-port="2" to-layer="3147" to-port="0" /> + <edge from-layer="3147" from-port="1" to-layer="3148" to-port="1" /> + <edge from-layer="3148" from-port="2" to-layer="3149" to-port="0" /> + <edge from-layer="3149" from-port="1" to-layer="3161" to-port="0" /> + <edge from-layer="3150" from-port="0" to-layer="3151" to-port="0" /> + <edge from-layer="3151" from-port="1" to-layer="3154" to-port="0" /> + <edge from-layer="3152" from-port="0" to-layer="3153" to-port="0" /> + <edge from-layer="3153" from-port="1" to-layer="3154" to-port="1" /> + <edge from-layer="3154" from-port="2" to-layer="3156" to-port="0" /> + <edge from-layer="3155" from-port="0" to-layer="3156" to-port="1" /> + <edge from-layer="3156" from-port="2" to-layer="3158" to-port="0" /> + <edge from-layer="3157" from-port="0" to-layer="3158" to-port="1" /> + <edge from-layer="3158" from-port="2" to-layer="3159" to-port="0" /> + <edge from-layer="3159" from-port="1" to-layer="3160" to-port="1" /> + <edge from-layer="3160" from-port="2" to-layer="3161" to-port="1" /> + <edge from-layer="3161" from-port="2" to-layer="3172" to-port="0" /> + <edge from-layer="3162" from-port="0" to-layer="3163" to-port="0" /> + <edge from-layer="3163" from-port="1" to-layer="3166" to-port="0" /> + <edge from-layer="3164" from-port="0" to-layer="3165" to-port="0" /> + <edge from-layer="3165" from-port="1" to-layer="3166" to-port="1" /> + <edge from-layer="3166" from-port="2" to-layer="3168" to-port="0" /> + <edge from-layer="3167" from-port="0" to-layer="3168" to-port="1" /> + <edge from-layer="3168" from-port="2" to-layer="3170" to-port="0" /> + <edge from-layer="3169" from-port="0" to-layer="3170" to-port="1" /> + <edge from-layer="3170" from-port="2" to-layer="3171" to-port="0" /> + <edge from-layer="3171" from-port="1" to-layer="3172" to-port="1" /> + <edge from-layer="3172" from-port="2" to-layer="3173" to-port="1" /> + <edge from-layer="3173" from-port="2" to-layer="3357" to-port="0" /> + <edge from-layer="3173" from-port="2" to-layer="3184" to-port="0" /> + <edge from-layer="3173" from-port="2" to-layer="3177" to-port="0" /> + <edge from-layer="3174" from-port="0" to-layer="3185" to-port="0" /> + <edge from-layer="3175" from-port="0" to-layer="3183" to-port="0" /> + <edge from-layer="3176" from-port="0" to-layer="3177" to-port="1" /> + <edge from-layer="3177" from-port="2" to-layer="3179" to-port="0" /> + <edge from-layer="3178" from-port="0" to-layer="3179" to-port="1" /> + <edge from-layer="3179" from-port="2" to-layer="3181" to-port="0" /> + <edge from-layer="3180" from-port="0" to-layer="3181" to-port="1" /> + <edge from-layer="3181" from-port="2" to-layer="3182" to-port="0" /> + <edge from-layer="3182" from-port="1" to-layer="3183" to-port="1" /> + <edge from-layer="3183" from-port="2" to-layer="3184" to-port="1" /> + <edge from-layer="3184" from-port="2" to-layer="3185" to-port="1" /> + <edge from-layer="3185" from-port="2" to-layer="3196" to-port="0" /> + <edge from-layer="3185" from-port="2" to-layer="3244" to-port="0" /> + <edge from-layer="3185" from-port="2" to-layer="3306" to-port="0" /> + <edge from-layer="3186" from-port="0" to-layer="3187" to-port="0" /> + <edge from-layer="3187" from-port="1" to-layer="3190" to-port="0" /> + <edge from-layer="3188" from-port="0" to-layer="3189" to-port="0" /> + <edge from-layer="3189" from-port="1" to-layer="3190" to-port="1" /> + <edge from-layer="3190" from-port="2" to-layer="3192" to-port="0" /> + <edge from-layer="3191" from-port="0" to-layer="3192" to-port="1" /> + <edge from-layer="3192" from-port="2" to-layer="3194" to-port="0" /> + <edge from-layer="3193" from-port="0" to-layer="3194" to-port="1" /> + <edge from-layer="3194" from-port="2" to-layer="3195" to-port="0" /> + <edge from-layer="3195" from-port="1" to-layer="3196" to-port="1" /> + <edge from-layer="3196" from-port="2" to-layer="3199" to-port="0" /> + <edge from-layer="3197" from-port="0" to-layer="3198" to-port="0" /> + <edge from-layer="3198" from-port="1" to-layer="3199" to-port="1" /> + <edge from-layer="3199" from-port="2" to-layer="3201" to-port="0" /> + <edge from-layer="3200" from-port="0" to-layer="3201" to-port="1" /> + <edge from-layer="3201" from-port="2" to-layer="3203" to-port="0" /> + <edge from-layer="3202" from-port="0" to-layer="3203" to-port="1" /> + <edge from-layer="3203" from-port="2" to-layer="3215" to-port="0" /> + <edge from-layer="3203" from-port="2" to-layer="3221" to-port="0" /> + <edge from-layer="3203" from-port="2" to-layer="3205" to-port="0" /> + <edge from-layer="3203" from-port="2" to-layer="3204" to-port="0" /> + <edge from-layer="3204" from-port="2" to-layer="3224" to-port="0" /> + <edge from-layer="3205" from-port="1" to-layer="3207" to-port="0" /> + <edge from-layer="3206" from-port="0" to-layer="3207" to-port="2" /> + <edge from-layer="3207" from-port="3" to-layer="3208" to-port="0" /> + <edge from-layer="3208" from-port="2" to-layer="3209" to-port="0" /> + <edge from-layer="3209" from-port="1" to-layer="3211" to-port="0" /> + <edge from-layer="3210" from-port="0" to-layer="3211" to-port="1" /> + <edge from-layer="3211" from-port="2" to-layer="3215" to-port="1" /> + <edge from-layer="3211" from-port="2" to-layer="3221" to-port="2" /> + <edge from-layer="3212" from-port="0" to-layer="3215" to-port="2" /> + <edge from-layer="3213" from-port="0" to-layer="3215" to-port="3" /> + <edge from-layer="3214" from-port="0" to-layer="3215" to-port="4" /> + <edge from-layer="3215" from-port="5" to-layer="3217" to-port="0" /> + <edge from-layer="3216" from-port="0" to-layer="3217" to-port="1" /> + <edge from-layer="3217" from-port="2" to-layer="3222" to-port="0" /> + <edge from-layer="3218" from-port="0" to-layer="3221" to-port="1" /> + <edge from-layer="3219" from-port="0" to-layer="3221" to-port="3" /> + <edge from-layer="3220" from-port="0" to-layer="3221" to-port="4" /> + <edge from-layer="3221" from-port="5" to-layer="3222" to-port="1" /> + <edge from-layer="3222" from-port="2" to-layer="3223" to-port="0" /> + <edge from-layer="3223" from-port="2" to-layer="3224" to-port="1" /> + <edge from-layer="3224" from-port="2" to-layer="3341" to-port="0" /> + <edge from-layer="3225" from-port="0" to-layer="3230" to-port="0" /> + <edge from-layer="3226" from-port="0" to-layer="3229" to-port="1" /> + <edge from-layer="3227" from-port="0" to-layer="3229" to-port="2" /> + <edge from-layer="3228" from-port="0" to-layer="3229" to-port="3" /> + <edge from-layer="3229" from-port="4" to-layer="3230" to-port="1" /> + <edge from-layer="3230" from-port="2" to-layer="3231" to-port="0" /> + <edge from-layer="3231" from-port="1" to-layer="3233" to-port="0" /> + <edge from-layer="3232" from-port="0" to-layer="3233" to-port="2" /> + <edge from-layer="3233" from-port="3" to-layer="3273" to-port="0" /> + <edge from-layer="3233" from-port="3" to-layer="3329" to-port="0" /> + <edge from-layer="3234" from-port="0" to-layer="3235" to-port="0" /> + <edge from-layer="3235" from-port="1" to-layer="3238" to-port="0" /> + <edge from-layer="3236" from-port="0" to-layer="3237" to-port="0" /> + <edge from-layer="3237" from-port="1" to-layer="3238" to-port="1" /> + <edge from-layer="3238" from-port="2" to-layer="3240" to-port="0" /> + <edge from-layer="3239" from-port="0" to-layer="3240" to-port="1" /> + <edge from-layer="3240" from-port="2" to-layer="3242" to-port="0" /> + <edge from-layer="3241" from-port="0" to-layer="3242" to-port="1" /> + <edge from-layer="3242" from-port="2" to-layer="3243" to-port="0" /> + <edge from-layer="3243" from-port="1" to-layer="3244" to-port="1" /> + <edge from-layer="3244" from-port="2" to-layer="3247" to-port="0" /> + <edge from-layer="3245" from-port="0" to-layer="3246" to-port="0" /> + <edge from-layer="3246" from-port="1" to-layer="3247" to-port="1" /> + <edge from-layer="3247" from-port="2" to-layer="3249" to-port="0" /> + <edge from-layer="3248" from-port="0" to-layer="3249" to-port="1" /> + <edge from-layer="3249" from-port="2" to-layer="3251" to-port="0" /> + <edge from-layer="3250" from-port="0" to-layer="3251" to-port="1" /> + <edge from-layer="3251" from-port="2" to-layer="3252" to-port="0" /> + <edge from-layer="3251" from-port="2" to-layer="3253" to-port="0" /> + <edge from-layer="3251" from-port="2" to-layer="3269" to-port="0" /> + <edge from-layer="3251" from-port="2" to-layer="3263" to-port="0" /> + <edge from-layer="3252" from-port="2" to-layer="3272" to-port="0" /> + <edge from-layer="3253" from-port="1" to-layer="3255" to-port="0" /> + <edge from-layer="3254" from-port="0" to-layer="3255" to-port="2" /> + <edge from-layer="3255" from-port="3" to-layer="3256" to-port="0" /> + <edge from-layer="3256" from-port="2" to-layer="3257" to-port="0" /> + <edge from-layer="3257" from-port="1" to-layer="3259" to-port="0" /> + <edge from-layer="3258" from-port="0" to-layer="3259" to-port="1" /> + <edge from-layer="3259" from-port="2" to-layer="3263" to-port="1" /> + <edge from-layer="3259" from-port="2" to-layer="3269" to-port="2" /> + <edge from-layer="3260" from-port="0" to-layer="3263" to-port="2" /> + <edge from-layer="3261" from-port="0" to-layer="3263" to-port="3" /> + <edge from-layer="3262" from-port="0" to-layer="3263" to-port="4" /> + <edge from-layer="3263" from-port="5" to-layer="3265" to-port="0" /> + <edge from-layer="3264" from-port="0" to-layer="3265" to-port="1" /> + <edge from-layer="3265" from-port="2" to-layer="3270" to-port="0" /> + <edge from-layer="3266" from-port="0" to-layer="3269" to-port="1" /> + <edge from-layer="3267" from-port="0" to-layer="3269" to-port="3" /> + <edge from-layer="3268" from-port="0" to-layer="3269" to-port="4" /> + <edge from-layer="3269" from-port="5" to-layer="3270" to-port="1" /> + <edge from-layer="3270" from-port="2" to-layer="3271" to-port="0" /> + <edge from-layer="3271" from-port="2" to-layer="3272" to-port="1" /> + <edge from-layer="3272" from-port="2" to-layer="3333" to-port="0" /> + <edge from-layer="3272" from-port="2" to-layer="3273" to-port="1" /> + <edge from-layer="3273" from-port="2" to-layer="11216" to-port="0" /> + <edge from-layer="3273" from-port="2" to-layer="3274" to-port="0" /> + <edge from-layer="3273" from-port="2" to-layer="3275" to-port="0" /> + <edge from-layer="3274" from-port="2" to-layer="3284" to-port="0" /> + <edge from-layer="3275" from-port="1" to-layer="3282" to-port="0" /> + <edge from-layer="3275" from-port="1" to-layer="3278" to-port="0" /> + <edge from-layer="3276" from-port="0" to-layer="3278" to-port="1" /> + <edge from-layer="3277" from-port="0" to-layer="3278" to-port="2" /> + <edge from-layer="3278" from-port="3" to-layer="3283" to-port="0" /> + <edge from-layer="3279" from-port="0" to-layer="3283" to-port="1" /> + <edge from-layer="3280" from-port="0" to-layer="3282" to-port="1" /> + <edge from-layer="3281" from-port="0" to-layer="3282" to-port="2" /> + <edge from-layer="3282" from-port="3" to-layer="3283" to-port="2" /> + <edge from-layer="3283" from-port="3" to-layer="3284" to-port="1" /> + <edge from-layer="3284" from-port="2" to-layer="3286" to-port="0" /> + <edge from-layer="3285" from-port="0" to-layer="3286" to-port="1" /> + <edge from-layer="3286" from-port="2" to-layer="3341" to-port="1" /> + <edge from-layer="3287" from-port="0" to-layer="3292" to-port="0" /> + <edge from-layer="3288" from-port="0" to-layer="3291" to-port="1" /> + <edge from-layer="3289" from-port="0" to-layer="3291" to-port="2" /> + <edge from-layer="3290" from-port="0" to-layer="3291" to-port="3" /> + <edge from-layer="3291" from-port="4" to-layer="3292" to-port="1" /> + <edge from-layer="3292" from-port="2" to-layer="3293" to-port="0" /> + <edge from-layer="3293" from-port="1" to-layer="3295" to-port="0" /> + <edge from-layer="3294" from-port="0" to-layer="3295" to-port="2" /> + <edge from-layer="3295" from-port="3" to-layer="3314" to-port="0" /> + <edge from-layer="3296" from-port="0" to-layer="3297" to-port="0" /> + <edge from-layer="3297" from-port="1" to-layer="3300" to-port="0" /> + <edge from-layer="3298" from-port="0" to-layer="3299" to-port="0" /> + <edge from-layer="3299" from-port="1" to-layer="3300" to-port="1" /> + <edge from-layer="3300" from-port="2" to-layer="3302" to-port="0" /> + <edge from-layer="3301" from-port="0" to-layer="3302" to-port="1" /> + <edge from-layer="3302" from-port="2" to-layer="3304" to-port="0" /> + <edge from-layer="3303" from-port="0" to-layer="3304" to-port="1" /> + <edge from-layer="3304" from-port="2" to-layer="3305" to-port="0" /> + <edge from-layer="3305" from-port="1" to-layer="3306" to-port="1" /> + <edge from-layer="3306" from-port="2" to-layer="3309" to-port="0" /> + <edge from-layer="3307" from-port="0" to-layer="3308" to-port="0" /> + <edge from-layer="3308" from-port="1" to-layer="3309" to-port="1" /> + <edge from-layer="3309" from-port="2" to-layer="3311" to-port="0" /> + <edge from-layer="3310" from-port="0" to-layer="3311" to-port="1" /> + <edge from-layer="3311" from-port="2" to-layer="3313" to-port="0" /> + <edge from-layer="3312" from-port="0" to-layer="3313" to-port="1" /> + <edge from-layer="3313" from-port="2" to-layer="3314" to-port="1" /> + <edge from-layer="3314" from-port="2" to-layer="3315" to-port="0" /> + <edge from-layer="3314" from-port="2" to-layer="3316" to-port="0" /> + <edge from-layer="3314" from-port="2" to-layer="11215" to-port="0" /> + <edge from-layer="3315" from-port="2" to-layer="3325" to-port="0" /> + <edge from-layer="3316" from-port="1" to-layer="3319" to-port="0" /> + <edge from-layer="3316" from-port="1" to-layer="3323" to-port="0" /> + <edge from-layer="3317" from-port="0" to-layer="3319" to-port="1" /> + <edge from-layer="3318" from-port="0" to-layer="3319" to-port="2" /> + <edge from-layer="3319" from-port="3" to-layer="3324" to-port="1" /> + <edge from-layer="3320" from-port="0" to-layer="3324" to-port="2" /> + <edge from-layer="3321" from-port="0" to-layer="3323" to-port="1" /> + <edge from-layer="3322" from-port="0" to-layer="3323" to-port="2" /> + <edge from-layer="3323" from-port="3" to-layer="3324" to-port="3" /> + <edge from-layer="3324" from-port="4" to-layer="3325" to-port="1" /> + <edge from-layer="3325" from-port="2" to-layer="3327" to-port="0" /> + <edge from-layer="3326" from-port="0" to-layer="3327" to-port="1" /> + <edge from-layer="3327" from-port="2" to-layer="3341" to-port="2" /> + <edge from-layer="3328" from-port="0" to-layer="3340" to-port="1" /> + <edge from-layer="3329" from-port="1" to-layer="3332" to-port="0" /> + <edge from-layer="3330" from-port="0" to-layer="3332" to-port="1" /> + <edge from-layer="3331" from-port="0" to-layer="3332" to-port="2" /> + <edge from-layer="3332" from-port="3" to-layer="3337" to-port="0" /> + <edge from-layer="3333" from-port="1" to-layer="3336" to-port="0" /> + <edge from-layer="3334" from-port="0" to-layer="3336" to-port="1" /> + <edge from-layer="3335" from-port="0" to-layer="3336" to-port="2" /> + <edge from-layer="3336" from-port="3" to-layer="3337" to-port="1" /> + <edge from-layer="3337" from-port="2" to-layer="3340" to-port="2" /> + <edge from-layer="3338" from-port="0" to-layer="3340" to-port="3" /> + <edge from-layer="3339" from-port="0" to-layer="3340" to-port="4" /> + <edge from-layer="3340" from-port="5" to-layer="3341" to-port="3" /> + <edge from-layer="3341" from-port="4" to-layer="3343" to-port="0" /> + <edge from-layer="3342" from-port="0" to-layer="3343" to-port="1" /> + <edge from-layer="3343" from-port="2" to-layer="3345" to-port="0" /> + <edge from-layer="3344" from-port="0" to-layer="3345" to-port="1" /> + <edge from-layer="3345" from-port="2" to-layer="3356" to-port="0" /> + <edge from-layer="3346" from-port="0" to-layer="3347" to-port="0" /> + <edge from-layer="3347" from-port="1" to-layer="3350" to-port="0" /> + <edge from-layer="3348" from-port="0" to-layer="3349" to-port="0" /> + <edge from-layer="3349" from-port="1" to-layer="3350" to-port="1" /> + <edge from-layer="3350" from-port="2" to-layer="3352" to-port="0" /> + <edge from-layer="3351" from-port="0" to-layer="3352" to-port="1" /> + <edge from-layer="3352" from-port="2" to-layer="3354" to-port="0" /> + <edge from-layer="3353" from-port="0" to-layer="3354" to-port="1" /> + <edge from-layer="3354" from-port="2" to-layer="3355" to-port="0" /> + <edge from-layer="3355" from-port="1" to-layer="3356" to-port="1" /> + <edge from-layer="3356" from-port="2" to-layer="3357" to-port="1" /> + <edge from-layer="3357" from-port="2" to-layer="3368" to-port="0" /> + <edge from-layer="3357" from-port="2" to-layer="3361" to-port="0" /> + <edge from-layer="3357" from-port="2" to-layer="3405" to-port="0" /> + <edge from-layer="3358" from-port="0" to-layer="3369" to-port="0" /> + <edge from-layer="3359" from-port="0" to-layer="3367" to-port="0" /> + <edge from-layer="3360" from-port="0" to-layer="3361" to-port="1" /> + <edge from-layer="3361" from-port="2" to-layer="3363" to-port="0" /> + <edge from-layer="3362" from-port="0" to-layer="3363" to-port="1" /> + <edge from-layer="3363" from-port="2" to-layer="3365" to-port="0" /> + <edge from-layer="3364" from-port="0" to-layer="3365" to-port="1" /> + <edge from-layer="3365" from-port="2" to-layer="3366" to-port="0" /> + <edge from-layer="3366" from-port="1" to-layer="3367" to-port="1" /> + <edge from-layer="3367" from-port="2" to-layer="3368" to-port="1" /> + <edge from-layer="3368" from-port="2" to-layer="3369" to-port="1" /> + <edge from-layer="3369" from-port="2" to-layer="3392" to-port="0" /> + <edge from-layer="3369" from-port="2" to-layer="3380" to-port="0" /> + <edge from-layer="3370" from-port="0" to-layer="3371" to-port="0" /> + <edge from-layer="3371" from-port="1" to-layer="3374" to-port="0" /> + <edge from-layer="3372" from-port="0" to-layer="3373" to-port="0" /> + <edge from-layer="3373" from-port="1" to-layer="3374" to-port="1" /> + <edge from-layer="3374" from-port="2" to-layer="3376" to-port="0" /> + <edge from-layer="3375" from-port="0" to-layer="3376" to-port="1" /> + <edge from-layer="3376" from-port="2" to-layer="3378" to-port="0" /> + <edge from-layer="3377" from-port="0" to-layer="3378" to-port="1" /> + <edge from-layer="3378" from-port="2" to-layer="3379" to-port="0" /> + <edge from-layer="3379" from-port="1" to-layer="3380" to-port="1" /> + <edge from-layer="3380" from-port="2" to-layer="3381" to-port="0" /> + <edge from-layer="3381" from-port="1" to-layer="3393" to-port="0" /> + <edge from-layer="3382" from-port="0" to-layer="3383" to-port="0" /> + <edge from-layer="3383" from-port="1" to-layer="3386" to-port="0" /> + <edge from-layer="3384" from-port="0" to-layer="3385" to-port="0" /> + <edge from-layer="3385" from-port="1" to-layer="3386" to-port="1" /> + <edge from-layer="3386" from-port="2" to-layer="3388" to-port="0" /> + <edge from-layer="3387" from-port="0" to-layer="3388" to-port="1" /> + <edge from-layer="3388" from-port="2" to-layer="3390" to-port="0" /> + <edge from-layer="3389" from-port="0" to-layer="3390" to-port="1" /> + <edge from-layer="3390" from-port="2" to-layer="3391" to-port="0" /> + <edge from-layer="3391" from-port="1" to-layer="3392" to-port="1" /> + <edge from-layer="3392" from-port="2" to-layer="3393" to-port="1" /> + <edge from-layer="3393" from-port="2" to-layer="3404" to-port="0" /> + <edge from-layer="3394" from-port="0" to-layer="3395" to-port="0" /> + <edge from-layer="3395" from-port="1" to-layer="3398" to-port="0" /> + <edge from-layer="3396" from-port="0" to-layer="3397" to-port="0" /> + <edge from-layer="3397" from-port="1" to-layer="3398" to-port="1" /> + <edge from-layer="3398" from-port="2" to-layer="3400" to-port="0" /> + <edge from-layer="3399" from-port="0" to-layer="3400" to-port="1" /> + <edge from-layer="3400" from-port="2" to-layer="3402" to-port="0" /> + <edge from-layer="3401" from-port="0" to-layer="3402" to-port="1" /> + <edge from-layer="3402" from-port="2" to-layer="3403" to-port="0" /> + <edge from-layer="3403" from-port="1" to-layer="3404" to-port="1" /> + <edge from-layer="3404" from-port="2" to-layer="3405" to-port="1" /> + <edge from-layer="3405" from-port="2" to-layer="3589" to-port="0" /> + <edge from-layer="3405" from-port="2" to-layer="3416" to-port="0" /> + <edge from-layer="3405" from-port="2" to-layer="3409" to-port="0" /> + <edge from-layer="3406" from-port="0" to-layer="3417" to-port="0" /> + <edge from-layer="3407" from-port="0" to-layer="3415" to-port="0" /> + <edge from-layer="3408" from-port="0" to-layer="3409" to-port="1" /> + <edge from-layer="3409" from-port="2" to-layer="3411" to-port="0" /> + <edge from-layer="3410" from-port="0" to-layer="3411" to-port="1" /> + <edge from-layer="3411" from-port="2" to-layer="3413" to-port="0" /> + <edge from-layer="3412" from-port="0" to-layer="3413" to-port="1" /> + <edge from-layer="3413" from-port="2" to-layer="3414" to-port="0" /> + <edge from-layer="3414" from-port="1" to-layer="3415" to-port="1" /> + <edge from-layer="3415" from-port="2" to-layer="3416" to-port="1" /> + <edge from-layer="3416" from-port="2" to-layer="3417" to-port="1" /> + <edge from-layer="3417" from-port="2" to-layer="3538" to-port="0" /> + <edge from-layer="3417" from-port="2" to-layer="3476" to-port="0" /> + <edge from-layer="3417" from-port="2" to-layer="3428" to-port="0" /> + <edge from-layer="3418" from-port="0" to-layer="3419" to-port="0" /> + <edge from-layer="3419" from-port="1" to-layer="3422" to-port="0" /> + <edge from-layer="3420" from-port="0" to-layer="3421" to-port="0" /> + <edge from-layer="3421" from-port="1" to-layer="3422" to-port="1" /> + <edge from-layer="3422" from-port="2" to-layer="3424" to-port="0" /> + <edge from-layer="3423" from-port="0" to-layer="3424" to-port="1" /> + <edge from-layer="3424" from-port="2" to-layer="3426" to-port="0" /> + <edge from-layer="3425" from-port="0" to-layer="3426" to-port="1" /> + <edge from-layer="3426" from-port="2" to-layer="3427" to-port="0" /> + <edge from-layer="3427" from-port="1" to-layer="3428" to-port="1" /> + <edge from-layer="3428" from-port="2" to-layer="3431" to-port="0" /> + <edge from-layer="3429" from-port="0" to-layer="3430" to-port="0" /> + <edge from-layer="3430" from-port="1" to-layer="3431" to-port="1" /> + <edge from-layer="3431" from-port="2" to-layer="3433" to-port="0" /> + <edge from-layer="3432" from-port="0" to-layer="3433" to-port="1" /> + <edge from-layer="3433" from-port="2" to-layer="3435" to-port="0" /> + <edge from-layer="3434" from-port="0" to-layer="3435" to-port="1" /> + <edge from-layer="3435" from-port="2" to-layer="3453" to-port="0" /> + <edge from-layer="3435" from-port="2" to-layer="3447" to-port="0" /> + <edge from-layer="3435" from-port="2" to-layer="3437" to-port="0" /> + <edge from-layer="3435" from-port="2" to-layer="3436" to-port="0" /> + <edge from-layer="3436" from-port="2" to-layer="3456" to-port="0" /> + <edge from-layer="3437" from-port="1" to-layer="3439" to-port="0" /> + <edge from-layer="3438" from-port="0" to-layer="3439" to-port="2" /> + <edge from-layer="3439" from-port="3" to-layer="3440" to-port="0" /> + <edge from-layer="3440" from-port="2" to-layer="3441" to-port="0" /> + <edge from-layer="3441" from-port="1" to-layer="3443" to-port="0" /> + <edge from-layer="3442" from-port="0" to-layer="3443" to-port="1" /> + <edge from-layer="3443" from-port="2" to-layer="3453" to-port="2" /> + <edge from-layer="3443" from-port="2" to-layer="3447" to-port="1" /> + <edge from-layer="3444" from-port="0" to-layer="3447" to-port="2" /> + <edge from-layer="3445" from-port="0" to-layer="3447" to-port="3" /> + <edge from-layer="3446" from-port="0" to-layer="3447" to-port="4" /> + <edge from-layer="3447" from-port="5" to-layer="3449" to-port="0" /> + <edge from-layer="3448" from-port="0" to-layer="3449" to-port="1" /> + <edge from-layer="3449" from-port="2" to-layer="3454" to-port="0" /> + <edge from-layer="3450" from-port="0" to-layer="3453" to-port="1" /> + <edge from-layer="3451" from-port="0" to-layer="3453" to-port="3" /> + <edge from-layer="3452" from-port="0" to-layer="3453" to-port="4" /> + <edge from-layer="3453" from-port="5" to-layer="3454" to-port="1" /> + <edge from-layer="3454" from-port="2" to-layer="3455" to-port="0" /> + <edge from-layer="3455" from-port="2" to-layer="3456" to-port="1" /> + <edge from-layer="3456" from-port="2" to-layer="3573" to-port="0" /> + <edge from-layer="3457" from-port="0" to-layer="3462" to-port="0" /> + <edge from-layer="3458" from-port="0" to-layer="3461" to-port="1" /> + <edge from-layer="3459" from-port="0" to-layer="3461" to-port="2" /> + <edge from-layer="3460" from-port="0" to-layer="3461" to-port="3" /> + <edge from-layer="3461" from-port="4" to-layer="3462" to-port="1" /> + <edge from-layer="3462" from-port="2" to-layer="3463" to-port="0" /> + <edge from-layer="3463" from-port="1" to-layer="3465" to-port="0" /> + <edge from-layer="3464" from-port="0" to-layer="3465" to-port="2" /> + <edge from-layer="3465" from-port="3" to-layer="3505" to-port="0" /> + <edge from-layer="3465" from-port="3" to-layer="3561" to-port="0" /> + <edge from-layer="3466" from-port="0" to-layer="3467" to-port="0" /> + <edge from-layer="3467" from-port="1" to-layer="3470" to-port="0" /> + <edge from-layer="3468" from-port="0" to-layer="3469" to-port="0" /> + <edge from-layer="3469" from-port="1" to-layer="3470" to-port="1" /> + <edge from-layer="3470" from-port="2" to-layer="3472" to-port="0" /> + <edge from-layer="3471" from-port="0" to-layer="3472" to-port="1" /> + <edge from-layer="3472" from-port="2" to-layer="3474" to-port="0" /> + <edge from-layer="3473" from-port="0" to-layer="3474" to-port="1" /> + <edge from-layer="3474" from-port="2" to-layer="3475" to-port="0" /> + <edge from-layer="3475" from-port="1" to-layer="3476" to-port="1" /> + <edge from-layer="3476" from-port="2" to-layer="3479" to-port="0" /> + <edge from-layer="3477" from-port="0" to-layer="3478" to-port="0" /> + <edge from-layer="3478" from-port="1" to-layer="3479" to-port="1" /> + <edge from-layer="3479" from-port="2" to-layer="3481" to-port="0" /> + <edge from-layer="3480" from-port="0" to-layer="3481" to-port="1" /> + <edge from-layer="3481" from-port="2" to-layer="3483" to-port="0" /> + <edge from-layer="3482" from-port="0" to-layer="3483" to-port="1" /> + <edge from-layer="3483" from-port="2" to-layer="3495" to-port="0" /> + <edge from-layer="3483" from-port="2" to-layer="3485" to-port="0" /> + <edge from-layer="3483" from-port="2" to-layer="3501" to-port="0" /> + <edge from-layer="3483" from-port="2" to-layer="3484" to-port="0" /> + <edge from-layer="3484" from-port="2" to-layer="3504" to-port="0" /> + <edge from-layer="3485" from-port="1" to-layer="3487" to-port="0" /> + <edge from-layer="3486" from-port="0" to-layer="3487" to-port="2" /> + <edge from-layer="3487" from-port="3" to-layer="3488" to-port="0" /> + <edge from-layer="3488" from-port="2" to-layer="3489" to-port="0" /> + <edge from-layer="3489" from-port="1" to-layer="3491" to-port="0" /> + <edge from-layer="3490" from-port="0" to-layer="3491" to-port="1" /> + <edge from-layer="3491" from-port="2" to-layer="3501" to-port="2" /> + <edge from-layer="3491" from-port="2" to-layer="3495" to-port="1" /> + <edge from-layer="3492" from-port="0" to-layer="3495" to-port="2" /> + <edge from-layer="3493" from-port="0" to-layer="3495" to-port="3" /> + <edge from-layer="3494" from-port="0" to-layer="3495" to-port="4" /> + <edge from-layer="3495" from-port="5" to-layer="3497" to-port="0" /> + <edge from-layer="3496" from-port="0" to-layer="3497" to-port="1" /> + <edge from-layer="3497" from-port="2" to-layer="3502" to-port="0" /> + <edge from-layer="3498" from-port="0" to-layer="3501" to-port="1" /> + <edge from-layer="3499" from-port="0" to-layer="3501" to-port="3" /> + <edge from-layer="3500" from-port="0" to-layer="3501" to-port="4" /> + <edge from-layer="3501" from-port="5" to-layer="3502" to-port="1" /> + <edge from-layer="3502" from-port="2" to-layer="3503" to-port="0" /> + <edge from-layer="3503" from-port="2" to-layer="3504" to-port="1" /> + <edge from-layer="3504" from-port="2" to-layer="3505" to-port="1" /> + <edge from-layer="3504" from-port="2" to-layer="3565" to-port="0" /> + <edge from-layer="3505" from-port="2" to-layer="3506" to-port="0" /> + <edge from-layer="3505" from-port="2" to-layer="11214" to-port="0" /> + <edge from-layer="3505" from-port="2" to-layer="3507" to-port="0" /> + <edge from-layer="3506" from-port="2" to-layer="3516" to-port="0" /> + <edge from-layer="3507" from-port="1" to-layer="3514" to-port="0" /> + <edge from-layer="3507" from-port="1" to-layer="3510" to-port="0" /> + <edge from-layer="3508" from-port="0" to-layer="3510" to-port="1" /> + <edge from-layer="3509" from-port="0" to-layer="3510" to-port="2" /> + <edge from-layer="3510" from-port="3" to-layer="3515" to-port="0" /> + <edge from-layer="3511" from-port="0" to-layer="3515" to-port="1" /> + <edge from-layer="3512" from-port="0" to-layer="3514" to-port="1" /> + <edge from-layer="3513" from-port="0" to-layer="3514" to-port="2" /> + <edge from-layer="3514" from-port="3" to-layer="3515" to-port="2" /> + <edge from-layer="3515" from-port="3" to-layer="3516" to-port="1" /> + <edge from-layer="3516" from-port="2" to-layer="3518" to-port="0" /> + <edge from-layer="3517" from-port="0" to-layer="3518" to-port="1" /> + <edge from-layer="3518" from-port="2" to-layer="3573" to-port="1" /> + <edge from-layer="3519" from-port="0" to-layer="3524" to-port="0" /> + <edge from-layer="3520" from-port="0" to-layer="3523" to-port="1" /> + <edge from-layer="3521" from-port="0" to-layer="3523" to-port="2" /> + <edge from-layer="3522" from-port="0" to-layer="3523" to-port="3" /> + <edge from-layer="3523" from-port="4" to-layer="3524" to-port="1" /> + <edge from-layer="3524" from-port="2" to-layer="3525" to-port="0" /> + <edge from-layer="3525" from-port="1" to-layer="3527" to-port="0" /> + <edge from-layer="3526" from-port="0" to-layer="3527" to-port="2" /> + <edge from-layer="3527" from-port="3" to-layer="3546" to-port="0" /> + <edge from-layer="3528" from-port="0" to-layer="3529" to-port="0" /> + <edge from-layer="3529" from-port="1" to-layer="3532" to-port="0" /> + <edge from-layer="3530" from-port="0" to-layer="3531" to-port="0" /> + <edge from-layer="3531" from-port="1" to-layer="3532" to-port="1" /> + <edge from-layer="3532" from-port="2" to-layer="3534" to-port="0" /> + <edge from-layer="3533" from-port="0" to-layer="3534" to-port="1" /> + <edge from-layer="3534" from-port="2" to-layer="3536" to-port="0" /> + <edge from-layer="3535" from-port="0" to-layer="3536" to-port="1" /> + <edge from-layer="3536" from-port="2" to-layer="3537" to-port="0" /> + <edge from-layer="3537" from-port="1" to-layer="3538" to-port="1" /> + <edge from-layer="3538" from-port="2" to-layer="3541" to-port="0" /> + <edge from-layer="3539" from-port="0" to-layer="3540" to-port="0" /> + <edge from-layer="3540" from-port="1" to-layer="3541" to-port="1" /> + <edge from-layer="3541" from-port="2" to-layer="3543" to-port="0" /> + <edge from-layer="3542" from-port="0" to-layer="3543" to-port="1" /> + <edge from-layer="3543" from-port="2" to-layer="3545" to-port="0" /> + <edge from-layer="3544" from-port="0" to-layer="3545" to-port="1" /> + <edge from-layer="3545" from-port="2" to-layer="3546" to-port="1" /> + <edge from-layer="3546" from-port="2" to-layer="11213" to-port="0" /> + <edge from-layer="3546" from-port="2" to-layer="3547" to-port="0" /> + <edge from-layer="3546" from-port="2" to-layer="3548" to-port="0" /> + <edge from-layer="3547" from-port="2" to-layer="3557" to-port="0" /> + <edge from-layer="3548" from-port="1" to-layer="3551" to-port="0" /> + <edge from-layer="3548" from-port="1" to-layer="3555" to-port="0" /> + <edge from-layer="3549" from-port="0" to-layer="3551" to-port="1" /> + <edge from-layer="3550" from-port="0" to-layer="3551" to-port="2" /> + <edge from-layer="3551" from-port="3" to-layer="3556" to-port="1" /> + <edge from-layer="3552" from-port="0" to-layer="3556" to-port="2" /> + <edge from-layer="3553" from-port="0" to-layer="3555" to-port="1" /> + <edge from-layer="3554" from-port="0" to-layer="3555" to-port="2" /> + <edge from-layer="3555" from-port="3" to-layer="3556" to-port="3" /> + <edge from-layer="3556" from-port="4" to-layer="3557" to-port="1" /> + <edge from-layer="3557" from-port="2" to-layer="3559" to-port="0" /> + <edge from-layer="3558" from-port="0" to-layer="3559" to-port="1" /> + <edge from-layer="3559" from-port="2" to-layer="3573" to-port="2" /> + <edge from-layer="3560" from-port="0" to-layer="3572" to-port="1" /> + <edge from-layer="3561" from-port="1" to-layer="3564" to-port="0" /> + <edge from-layer="3562" from-port="0" to-layer="3564" to-port="1" /> + <edge from-layer="3563" from-port="0" to-layer="3564" to-port="2" /> + <edge from-layer="3564" from-port="3" to-layer="3569" to-port="0" /> + <edge from-layer="3565" from-port="1" to-layer="3568" to-port="0" /> + <edge from-layer="3566" from-port="0" to-layer="3568" to-port="1" /> + <edge from-layer="3567" from-port="0" to-layer="3568" to-port="2" /> + <edge from-layer="3568" from-port="3" to-layer="3569" to-port="1" /> + <edge from-layer="3569" from-port="2" to-layer="3572" to-port="2" /> + <edge from-layer="3570" from-port="0" to-layer="3572" to-port="3" /> + <edge from-layer="3571" from-port="0" to-layer="3572" to-port="4" /> + <edge from-layer="3572" from-port="5" to-layer="3573" to-port="3" /> + <edge from-layer="3573" from-port="4" to-layer="3575" to-port="0" /> + <edge from-layer="3574" from-port="0" to-layer="3575" to-port="1" /> + <edge from-layer="3575" from-port="2" to-layer="3577" to-port="0" /> + <edge from-layer="3576" from-port="0" to-layer="3577" to-port="1" /> + <edge from-layer="3577" from-port="2" to-layer="3588" to-port="0" /> + <edge from-layer="3578" from-port="0" to-layer="3579" to-port="0" /> + <edge from-layer="3579" from-port="1" to-layer="3582" to-port="0" /> + <edge from-layer="3580" from-port="0" to-layer="3581" to-port="0" /> + <edge from-layer="3581" from-port="1" to-layer="3582" to-port="1" /> + <edge from-layer="3582" from-port="2" to-layer="3584" to-port="0" /> + <edge from-layer="3583" from-port="0" to-layer="3584" to-port="1" /> + <edge from-layer="3584" from-port="2" to-layer="3586" to-port="0" /> + <edge from-layer="3585" from-port="0" to-layer="3586" to-port="1" /> + <edge from-layer="3586" from-port="2" to-layer="3587" to-port="0" /> + <edge from-layer="3587" from-port="1" to-layer="3588" to-port="1" /> + <edge from-layer="3588" from-port="2" to-layer="3589" to-port="1" /> + <edge from-layer="3589" from-port="2" to-layer="3593" to-port="0" /> + <edge from-layer="3589" from-port="2" to-layer="3637" to-port="0" /> + <edge from-layer="3589" from-port="2" to-layer="3600" to-port="0" /> + <edge from-layer="3590" from-port="0" to-layer="3601" to-port="0" /> + <edge from-layer="3591" from-port="0" to-layer="3599" to-port="0" /> + <edge from-layer="3592" from-port="0" to-layer="3593" to-port="1" /> + <edge from-layer="3593" from-port="2" to-layer="3595" to-port="0" /> + <edge from-layer="3594" from-port="0" to-layer="3595" to-port="1" /> + <edge from-layer="3595" from-port="2" to-layer="3597" to-port="0" /> + <edge from-layer="3596" from-port="0" to-layer="3597" to-port="1" /> + <edge from-layer="3597" from-port="2" to-layer="3598" to-port="0" /> + <edge from-layer="3598" from-port="1" to-layer="3599" to-port="1" /> + <edge from-layer="3599" from-port="2" to-layer="3600" to-port="1" /> + <edge from-layer="3600" from-port="2" to-layer="3601" to-port="1" /> + <edge from-layer="3601" from-port="2" to-layer="3624" to-port="0" /> + <edge from-layer="3601" from-port="2" to-layer="3612" to-port="0" /> + <edge from-layer="3602" from-port="0" to-layer="3603" to-port="0" /> + <edge from-layer="3603" from-port="1" to-layer="3606" to-port="0" /> + <edge from-layer="3604" from-port="0" to-layer="3605" to-port="0" /> + <edge from-layer="3605" from-port="1" to-layer="3606" to-port="1" /> + <edge from-layer="3606" from-port="2" to-layer="3608" to-port="0" /> + <edge from-layer="3607" from-port="0" to-layer="3608" to-port="1" /> + <edge from-layer="3608" from-port="2" to-layer="3610" to-port="0" /> + <edge from-layer="3609" from-port="0" to-layer="3610" to-port="1" /> + <edge from-layer="3610" from-port="2" to-layer="3611" to-port="0" /> + <edge from-layer="3611" from-port="1" to-layer="3612" to-port="1" /> + <edge from-layer="3612" from-port="2" to-layer="3613" to-port="0" /> + <edge from-layer="3613" from-port="1" to-layer="3625" to-port="0" /> + <edge from-layer="3614" from-port="0" to-layer="3615" to-port="0" /> + <edge from-layer="3615" from-port="1" to-layer="3618" to-port="0" /> + <edge from-layer="3616" from-port="0" to-layer="3617" to-port="0" /> + <edge from-layer="3617" from-port="1" to-layer="3618" to-port="1" /> + <edge from-layer="3618" from-port="2" to-layer="3620" to-port="0" /> + <edge from-layer="3619" from-port="0" to-layer="3620" to-port="1" /> + <edge from-layer="3620" from-port="2" to-layer="3622" to-port="0" /> + <edge from-layer="3621" from-port="0" to-layer="3622" to-port="1" /> + <edge from-layer="3622" from-port="2" to-layer="3623" to-port="0" /> + <edge from-layer="3623" from-port="1" to-layer="3624" to-port="1" /> + <edge from-layer="3624" from-port="2" to-layer="3625" to-port="1" /> + <edge from-layer="3625" from-port="2" to-layer="3636" to-port="0" /> + <edge from-layer="3626" from-port="0" to-layer="3627" to-port="0" /> + <edge from-layer="3627" from-port="1" to-layer="3630" to-port="0" /> + <edge from-layer="3628" from-port="0" to-layer="3629" to-port="0" /> + <edge from-layer="3629" from-port="1" to-layer="3630" to-port="1" /> + <edge from-layer="3630" from-port="2" to-layer="3632" to-port="0" /> + <edge from-layer="3631" from-port="0" to-layer="3632" to-port="1" /> + <edge from-layer="3632" from-port="2" to-layer="3634" to-port="0" /> + <edge from-layer="3633" from-port="0" to-layer="3634" to-port="1" /> + <edge from-layer="3634" from-port="2" to-layer="3635" to-port="0" /> + <edge from-layer="3635" from-port="1" to-layer="3636" to-port="1" /> + <edge from-layer="3636" from-port="2" to-layer="3637" to-port="1" /> + <edge from-layer="3637" from-port="2" to-layer="3641" to-port="0" /> + <edge from-layer="3637" from-port="2" to-layer="3648" to-port="0" /> + <edge from-layer="3637" from-port="2" to-layer="3821" to-port="0" /> + <edge from-layer="3638" from-port="0" to-layer="3649" to-port="0" /> + <edge from-layer="3639" from-port="0" to-layer="3647" to-port="0" /> + <edge from-layer="3640" from-port="0" to-layer="3641" to-port="1" /> + <edge from-layer="3641" from-port="2" to-layer="3643" to-port="0" /> + <edge from-layer="3642" from-port="0" to-layer="3643" to-port="1" /> + <edge from-layer="3643" from-port="2" to-layer="3645" to-port="0" /> + <edge from-layer="3644" from-port="0" to-layer="3645" to-port="1" /> + <edge from-layer="3645" from-port="2" to-layer="3646" to-port="0" /> + <edge from-layer="3646" from-port="1" to-layer="3647" to-port="1" /> + <edge from-layer="3647" from-port="2" to-layer="3648" to-port="1" /> + <edge from-layer="3648" from-port="2" to-layer="3649" to-port="1" /> + <edge from-layer="3649" from-port="2" to-layer="3708" to-port="0" /> + <edge from-layer="3649" from-port="2" to-layer="3770" to-port="0" /> + <edge from-layer="3649" from-port="2" to-layer="3660" to-port="0" /> + <edge from-layer="3650" from-port="0" to-layer="3651" to-port="0" /> + <edge from-layer="3651" from-port="1" to-layer="3654" to-port="0" /> + <edge from-layer="3652" from-port="0" to-layer="3653" to-port="0" /> + <edge from-layer="3653" from-port="1" to-layer="3654" to-port="1" /> + <edge from-layer="3654" from-port="2" to-layer="3656" to-port="0" /> + <edge from-layer="3655" from-port="0" to-layer="3656" to-port="1" /> + <edge from-layer="3656" from-port="2" to-layer="3658" to-port="0" /> + <edge from-layer="3657" from-port="0" to-layer="3658" to-port="1" /> + <edge from-layer="3658" from-port="2" to-layer="3659" to-port="0" /> + <edge from-layer="3659" from-port="1" to-layer="3660" to-port="1" /> + <edge from-layer="3660" from-port="2" to-layer="3663" to-port="0" /> + <edge from-layer="3661" from-port="0" to-layer="3662" to-port="0" /> + <edge from-layer="3662" from-port="1" to-layer="3663" to-port="1" /> + <edge from-layer="3663" from-port="2" to-layer="3665" to-port="0" /> + <edge from-layer="3664" from-port="0" to-layer="3665" to-port="1" /> + <edge from-layer="3665" from-port="2" to-layer="3667" to-port="0" /> + <edge from-layer="3666" from-port="0" to-layer="3667" to-port="1" /> + <edge from-layer="3667" from-port="2" to-layer="3685" to-port="0" /> + <edge from-layer="3667" from-port="2" to-layer="3668" to-port="0" /> + <edge from-layer="3667" from-port="2" to-layer="3669" to-port="0" /> + <edge from-layer="3667" from-port="2" to-layer="3679" to-port="0" /> + <edge from-layer="3668" from-port="2" to-layer="3688" to-port="0" /> + <edge from-layer="3669" from-port="1" to-layer="3671" to-port="0" /> + <edge from-layer="3670" from-port="0" to-layer="3671" to-port="2" /> + <edge from-layer="3671" from-port="3" to-layer="3672" to-port="0" /> + <edge from-layer="3672" from-port="2" to-layer="3673" to-port="0" /> + <edge from-layer="3673" from-port="1" to-layer="3675" to-port="0" /> + <edge from-layer="3674" from-port="0" to-layer="3675" to-port="1" /> + <edge from-layer="3675" from-port="2" to-layer="3679" to-port="1" /> + <edge from-layer="3675" from-port="2" to-layer="3685" to-port="2" /> + <edge from-layer="3676" from-port="0" to-layer="3679" to-port="2" /> + <edge from-layer="3677" from-port="0" to-layer="3679" to-port="3" /> + <edge from-layer="3678" from-port="0" to-layer="3679" to-port="4" /> + <edge from-layer="3679" from-port="5" to-layer="3681" to-port="0" /> + <edge from-layer="3680" from-port="0" to-layer="3681" to-port="1" /> + <edge from-layer="3681" from-port="2" to-layer="3686" to-port="0" /> + <edge from-layer="3682" from-port="0" to-layer="3685" to-port="1" /> + <edge from-layer="3683" from-port="0" to-layer="3685" to-port="3" /> + <edge from-layer="3684" from-port="0" to-layer="3685" to-port="4" /> + <edge from-layer="3685" from-port="5" to-layer="3686" to-port="1" /> + <edge from-layer="3686" from-port="2" to-layer="3687" to-port="0" /> + <edge from-layer="3687" from-port="2" to-layer="3688" to-port="1" /> + <edge from-layer="3688" from-port="2" to-layer="3805" to-port="0" /> + <edge from-layer="3689" from-port="0" to-layer="3694" to-port="0" /> + <edge from-layer="3690" from-port="0" to-layer="3693" to-port="1" /> + <edge from-layer="3691" from-port="0" to-layer="3693" to-port="2" /> + <edge from-layer="3692" from-port="0" to-layer="3693" to-port="3" /> + <edge from-layer="3693" from-port="4" to-layer="3694" to-port="1" /> + <edge from-layer="3694" from-port="2" to-layer="3695" to-port="0" /> + <edge from-layer="3695" from-port="1" to-layer="3697" to-port="0" /> + <edge from-layer="3696" from-port="0" to-layer="3697" to-port="2" /> + <edge from-layer="3697" from-port="3" to-layer="3793" to-port="0" /> + <edge from-layer="3697" from-port="3" to-layer="3737" to-port="0" /> + <edge from-layer="3698" from-port="0" to-layer="3699" to-port="0" /> + <edge from-layer="3699" from-port="1" to-layer="3702" to-port="0" /> + <edge from-layer="3700" from-port="0" to-layer="3701" to-port="0" /> + <edge from-layer="3701" from-port="1" to-layer="3702" to-port="1" /> + <edge from-layer="3702" from-port="2" to-layer="3704" to-port="0" /> + <edge from-layer="3703" from-port="0" to-layer="3704" to-port="1" /> + <edge from-layer="3704" from-port="2" to-layer="3706" to-port="0" /> + <edge from-layer="3705" from-port="0" to-layer="3706" to-port="1" /> + <edge from-layer="3706" from-port="2" to-layer="3707" to-port="0" /> + <edge from-layer="3707" from-port="1" to-layer="3708" to-port="1" /> + <edge from-layer="3708" from-port="2" to-layer="3711" to-port="0" /> + <edge from-layer="3709" from-port="0" to-layer="3710" to-port="0" /> + <edge from-layer="3710" from-port="1" to-layer="3711" to-port="1" /> + <edge from-layer="3711" from-port="2" to-layer="3713" to-port="0" /> + <edge from-layer="3712" from-port="0" to-layer="3713" to-port="1" /> + <edge from-layer="3713" from-port="2" to-layer="3715" to-port="0" /> + <edge from-layer="3714" from-port="0" to-layer="3715" to-port="1" /> + <edge from-layer="3715" from-port="2" to-layer="3716" to-port="0" /> + <edge from-layer="3715" from-port="2" to-layer="3717" to-port="0" /> + <edge from-layer="3715" from-port="2" to-layer="3727" to-port="0" /> + <edge from-layer="3715" from-port="2" to-layer="3733" to-port="0" /> + <edge from-layer="3716" from-port="2" to-layer="3736" to-port="0" /> + <edge from-layer="3717" from-port="1" to-layer="3719" to-port="0" /> + <edge from-layer="3718" from-port="0" to-layer="3719" to-port="2" /> + <edge from-layer="3719" from-port="3" to-layer="3720" to-port="0" /> + <edge from-layer="3720" from-port="2" to-layer="3721" to-port="0" /> + <edge from-layer="3721" from-port="1" to-layer="3723" to-port="0" /> + <edge from-layer="3722" from-port="0" to-layer="3723" to-port="1" /> + <edge from-layer="3723" from-port="2" to-layer="3727" to-port="1" /> + <edge from-layer="3723" from-port="2" to-layer="3733" to-port="2" /> + <edge from-layer="3724" from-port="0" to-layer="3727" to-port="2" /> + <edge from-layer="3725" from-port="0" to-layer="3727" to-port="3" /> + <edge from-layer="3726" from-port="0" to-layer="3727" to-port="4" /> + <edge from-layer="3727" from-port="5" to-layer="3729" to-port="0" /> + <edge from-layer="3728" from-port="0" to-layer="3729" to-port="1" /> + <edge from-layer="3729" from-port="2" to-layer="3734" to-port="0" /> + <edge from-layer="3730" from-port="0" to-layer="3733" to-port="1" /> + <edge from-layer="3731" from-port="0" to-layer="3733" to-port="3" /> + <edge from-layer="3732" from-port="0" to-layer="3733" to-port="4" /> + <edge from-layer="3733" from-port="5" to-layer="3734" to-port="1" /> + <edge from-layer="3734" from-port="2" to-layer="3735" to-port="0" /> + <edge from-layer="3735" from-port="2" to-layer="3736" to-port="1" /> + <edge from-layer="3736" from-port="2" to-layer="3737" to-port="1" /> + <edge from-layer="3736" from-port="2" to-layer="3797" to-port="0" /> + <edge from-layer="3737" from-port="2" to-layer="11212" to-port="0" /> + <edge from-layer="3737" from-port="2" to-layer="3738" to-port="0" /> + <edge from-layer="3737" from-port="2" to-layer="3739" to-port="0" /> + <edge from-layer="3738" from-port="2" to-layer="3748" to-port="0" /> + <edge from-layer="3739" from-port="1" to-layer="3746" to-port="0" /> + <edge from-layer="3739" from-port="1" to-layer="3742" to-port="0" /> + <edge from-layer="3740" from-port="0" to-layer="3742" to-port="1" /> + <edge from-layer="3741" from-port="0" to-layer="3742" to-port="2" /> + <edge from-layer="3742" from-port="3" to-layer="3747" to-port="0" /> + <edge from-layer="3743" from-port="0" to-layer="3747" to-port="1" /> + <edge from-layer="3744" from-port="0" to-layer="3746" to-port="1" /> + <edge from-layer="3745" from-port="0" to-layer="3746" to-port="2" /> + <edge from-layer="3746" from-port="3" to-layer="3747" to-port="2" /> + <edge from-layer="3747" from-port="3" to-layer="3748" to-port="1" /> + <edge from-layer="3748" from-port="2" to-layer="3750" to-port="0" /> + <edge from-layer="3749" from-port="0" to-layer="3750" to-port="1" /> + <edge from-layer="3750" from-port="2" to-layer="3805" to-port="1" /> + <edge from-layer="3751" from-port="0" to-layer="3756" to-port="0" /> + <edge from-layer="3752" from-port="0" to-layer="3755" to-port="1" /> + <edge from-layer="3753" from-port="0" to-layer="3755" to-port="2" /> + <edge from-layer="3754" from-port="0" to-layer="3755" to-port="3" /> + <edge from-layer="3755" from-port="4" to-layer="3756" to-port="1" /> + <edge from-layer="3756" from-port="2" to-layer="3757" to-port="0" /> + <edge from-layer="3757" from-port="1" to-layer="3759" to-port="0" /> + <edge from-layer="3758" from-port="0" to-layer="3759" to-port="2" /> + <edge from-layer="3759" from-port="3" to-layer="3778" to-port="0" /> + <edge from-layer="3760" from-port="0" to-layer="3761" to-port="0" /> + <edge from-layer="3761" from-port="1" to-layer="3764" to-port="0" /> + <edge from-layer="3762" from-port="0" to-layer="3763" to-port="0" /> + <edge from-layer="3763" from-port="1" to-layer="3764" to-port="1" /> + <edge from-layer="3764" from-port="2" to-layer="3766" to-port="0" /> + <edge from-layer="3765" from-port="0" to-layer="3766" to-port="1" /> + <edge from-layer="3766" from-port="2" to-layer="3768" to-port="0" /> + <edge from-layer="3767" from-port="0" to-layer="3768" to-port="1" /> + <edge from-layer="3768" from-port="2" to-layer="3769" to-port="0" /> + <edge from-layer="3769" from-port="1" to-layer="3770" to-port="1" /> + <edge from-layer="3770" from-port="2" to-layer="3773" to-port="0" /> + <edge from-layer="3771" from-port="0" to-layer="3772" to-port="0" /> + <edge from-layer="3772" from-port="1" to-layer="3773" to-port="1" /> + <edge from-layer="3773" from-port="2" to-layer="3775" to-port="0" /> + <edge from-layer="3774" from-port="0" to-layer="3775" to-port="1" /> + <edge from-layer="3775" from-port="2" to-layer="3777" to-port="0" /> + <edge from-layer="3776" from-port="0" to-layer="3777" to-port="1" /> + <edge from-layer="3777" from-port="2" to-layer="3778" to-port="1" /> + <edge from-layer="3778" from-port="2" to-layer="3779" to-port="0" /> + <edge from-layer="3778" from-port="2" to-layer="3780" to-port="0" /> + <edge from-layer="3778" from-port="2" to-layer="11211" to-port="0" /> + <edge from-layer="3779" from-port="2" to-layer="3789" to-port="0" /> + <edge from-layer="3780" from-port="1" to-layer="3783" to-port="0" /> + <edge from-layer="3780" from-port="1" to-layer="3787" to-port="0" /> + <edge from-layer="3781" from-port="0" to-layer="3783" to-port="1" /> + <edge from-layer="3782" from-port="0" to-layer="3783" to-port="2" /> + <edge from-layer="3783" from-port="3" to-layer="3788" to-port="1" /> + <edge from-layer="3784" from-port="0" to-layer="3788" to-port="2" /> + <edge from-layer="3785" from-port="0" to-layer="3787" to-port="1" /> + <edge from-layer="3786" from-port="0" to-layer="3787" to-port="2" /> + <edge from-layer="3787" from-port="3" to-layer="3788" to-port="3" /> + <edge from-layer="3788" from-port="4" to-layer="3789" to-port="1" /> + <edge from-layer="3789" from-port="2" to-layer="3791" to-port="0" /> + <edge from-layer="3790" from-port="0" to-layer="3791" to-port="1" /> + <edge from-layer="3791" from-port="2" to-layer="3805" to-port="2" /> + <edge from-layer="3792" from-port="0" to-layer="3804" to-port="1" /> + <edge from-layer="3793" from-port="1" to-layer="3796" to-port="0" /> + <edge from-layer="3794" from-port="0" to-layer="3796" to-port="1" /> + <edge from-layer="3795" from-port="0" to-layer="3796" to-port="2" /> + <edge from-layer="3796" from-port="3" to-layer="3801" to-port="0" /> + <edge from-layer="3797" from-port="1" to-layer="3800" to-port="0" /> + <edge from-layer="3798" from-port="0" to-layer="3800" to-port="1" /> + <edge from-layer="3799" from-port="0" to-layer="3800" to-port="2" /> + <edge from-layer="3800" from-port="3" to-layer="3801" to-port="1" /> + <edge from-layer="3801" from-port="2" to-layer="3804" to-port="2" /> + <edge from-layer="3802" from-port="0" to-layer="3804" to-port="3" /> + <edge from-layer="3803" from-port="0" to-layer="3804" to-port="4" /> + <edge from-layer="3804" from-port="5" to-layer="3805" to-port="3" /> + <edge from-layer="3805" from-port="4" to-layer="3807" to-port="0" /> + <edge from-layer="3806" from-port="0" to-layer="3807" to-port="1" /> + <edge from-layer="3807" from-port="2" to-layer="3809" to-port="0" /> + <edge from-layer="3808" from-port="0" to-layer="3809" to-port="1" /> + <edge from-layer="3809" from-port="2" to-layer="3820" to-port="0" /> + <edge from-layer="3810" from-port="0" to-layer="3811" to-port="0" /> + <edge from-layer="3811" from-port="1" to-layer="3814" to-port="0" /> + <edge from-layer="3812" from-port="0" to-layer="3813" to-port="0" /> + <edge from-layer="3813" from-port="1" to-layer="3814" to-port="1" /> + <edge from-layer="3814" from-port="2" to-layer="3816" to-port="0" /> + <edge from-layer="3815" from-port="0" to-layer="3816" to-port="1" /> + <edge from-layer="3816" from-port="2" to-layer="3818" to-port="0" /> + <edge from-layer="3817" from-port="0" to-layer="3818" to-port="1" /> + <edge from-layer="3818" from-port="2" to-layer="3819" to-port="0" /> + <edge from-layer="3819" from-port="1" to-layer="3820" to-port="1" /> + <edge from-layer="3820" from-port="2" to-layer="3821" to-port="1" /> + <edge from-layer="3821" from-port="2" to-layer="3832" to-port="0" /> + <edge from-layer="3821" from-port="2" to-layer="3825" to-port="0" /> + <edge from-layer="3821" from-port="2" to-layer="3869" to-port="0" /> + <edge from-layer="3822" from-port="0" to-layer="3833" to-port="0" /> + <edge from-layer="3823" from-port="0" to-layer="3831" to-port="0" /> + <edge from-layer="3824" from-port="0" to-layer="3825" to-port="1" /> + <edge from-layer="3825" from-port="2" to-layer="3827" to-port="0" /> + <edge from-layer="3826" from-port="0" to-layer="3827" to-port="1" /> + <edge from-layer="3827" from-port="2" to-layer="3829" to-port="0" /> + <edge from-layer="3828" from-port="0" to-layer="3829" to-port="1" /> + <edge from-layer="3829" from-port="2" to-layer="3830" to-port="0" /> + <edge from-layer="3830" from-port="1" to-layer="3831" to-port="1" /> + <edge from-layer="3831" from-port="2" to-layer="3832" to-port="1" /> + <edge from-layer="3832" from-port="2" to-layer="3833" to-port="1" /> + <edge from-layer="3833" from-port="2" to-layer="3856" to-port="0" /> + <edge from-layer="3833" from-port="2" to-layer="3844" to-port="0" /> + <edge from-layer="3834" from-port="0" to-layer="3835" to-port="0" /> + <edge from-layer="3835" from-port="1" to-layer="3838" to-port="0" /> + <edge from-layer="3836" from-port="0" to-layer="3837" to-port="0" /> + <edge from-layer="3837" from-port="1" to-layer="3838" to-port="1" /> + <edge from-layer="3838" from-port="2" to-layer="3840" to-port="0" /> + <edge from-layer="3839" from-port="0" to-layer="3840" to-port="1" /> + <edge from-layer="3840" from-port="2" to-layer="3842" to-port="0" /> + <edge from-layer="3841" from-port="0" to-layer="3842" to-port="1" /> + <edge from-layer="3842" from-port="2" to-layer="3843" to-port="0" /> + <edge from-layer="3843" from-port="1" to-layer="3844" to-port="1" /> + <edge from-layer="3844" from-port="2" to-layer="3845" to-port="0" /> + <edge from-layer="3845" from-port="1" to-layer="3857" to-port="0" /> + <edge from-layer="3846" from-port="0" to-layer="3847" to-port="0" /> + <edge from-layer="3847" from-port="1" to-layer="3850" to-port="0" /> + <edge from-layer="3848" from-port="0" to-layer="3849" to-port="0" /> + <edge from-layer="3849" from-port="1" to-layer="3850" to-port="1" /> + <edge from-layer="3850" from-port="2" to-layer="3852" to-port="0" /> + <edge from-layer="3851" from-port="0" to-layer="3852" to-port="1" /> + <edge from-layer="3852" from-port="2" to-layer="3854" to-port="0" /> + <edge from-layer="3853" from-port="0" to-layer="3854" to-port="1" /> + <edge from-layer="3854" from-port="2" to-layer="3855" to-port="0" /> + <edge from-layer="3855" from-port="1" to-layer="3856" to-port="1" /> + <edge from-layer="3856" from-port="2" to-layer="3857" to-port="1" /> + <edge from-layer="3857" from-port="2" to-layer="3868" to-port="0" /> + <edge from-layer="3858" from-port="0" to-layer="3859" to-port="0" /> + <edge from-layer="3859" from-port="1" to-layer="3862" to-port="0" /> + <edge from-layer="3860" from-port="0" to-layer="3861" to-port="0" /> + <edge from-layer="3861" from-port="1" to-layer="3862" to-port="1" /> + <edge from-layer="3862" from-port="2" to-layer="3864" to-port="0" /> + <edge from-layer="3863" from-port="0" to-layer="3864" to-port="1" /> + <edge from-layer="3864" from-port="2" to-layer="3866" to-port="0" /> + <edge from-layer="3865" from-port="0" to-layer="3866" to-port="1" /> + <edge from-layer="3866" from-port="2" to-layer="3867" to-port="0" /> + <edge from-layer="3867" from-port="1" to-layer="3868" to-port="1" /> + <edge from-layer="3868" from-port="2" to-layer="3869" to-port="1" /> + <edge from-layer="3869" from-port="2" to-layer="3880" to-port="0" /> + <edge from-layer="3869" from-port="2" to-layer="4053" to-port="0" /> + <edge from-layer="3869" from-port="2" to-layer="3873" to-port="0" /> + <edge from-layer="3870" from-port="0" to-layer="3881" to-port="0" /> + <edge from-layer="3871" from-port="0" to-layer="3879" to-port="0" /> + <edge from-layer="3872" from-port="0" to-layer="3873" to-port="1" /> + <edge from-layer="3873" from-port="2" to-layer="3875" to-port="0" /> + <edge from-layer="3874" from-port="0" to-layer="3875" to-port="1" /> + <edge from-layer="3875" from-port="2" to-layer="3877" to-port="0" /> + <edge from-layer="3876" from-port="0" to-layer="3877" to-port="1" /> + <edge from-layer="3877" from-port="2" to-layer="3878" to-port="0" /> + <edge from-layer="3878" from-port="1" to-layer="3879" to-port="1" /> + <edge from-layer="3879" from-port="2" to-layer="3880" to-port="1" /> + <edge from-layer="3880" from-port="2" to-layer="3881" to-port="1" /> + <edge from-layer="3881" from-port="2" to-layer="3892" to-port="0" /> + <edge from-layer="3881" from-port="2" to-layer="4002" to-port="0" /> + <edge from-layer="3881" from-port="2" to-layer="3940" to-port="0" /> + <edge from-layer="3882" from-port="0" to-layer="3883" to-port="0" /> + <edge from-layer="3883" from-port="1" to-layer="3886" to-port="0" /> + <edge from-layer="3884" from-port="0" to-layer="3885" to-port="0" /> + <edge from-layer="3885" from-port="1" to-layer="3886" to-port="1" /> + <edge from-layer="3886" from-port="2" to-layer="3888" to-port="0" /> + <edge from-layer="3887" from-port="0" to-layer="3888" to-port="1" /> + <edge from-layer="3888" from-port="2" to-layer="3890" to-port="0" /> + <edge from-layer="3889" from-port="0" to-layer="3890" to-port="1" /> + <edge from-layer="3890" from-port="2" to-layer="3891" to-port="0" /> + <edge from-layer="3891" from-port="1" to-layer="3892" to-port="1" /> + <edge from-layer="3892" from-port="2" to-layer="3895" to-port="0" /> + <edge from-layer="3893" from-port="0" to-layer="3894" to-port="0" /> + <edge from-layer="3894" from-port="1" to-layer="3895" to-port="1" /> + <edge from-layer="3895" from-port="2" to-layer="3897" to-port="0" /> + <edge from-layer="3896" from-port="0" to-layer="3897" to-port="1" /> + <edge from-layer="3897" from-port="2" to-layer="3899" to-port="0" /> + <edge from-layer="3898" from-port="0" to-layer="3899" to-port="1" /> + <edge from-layer="3899" from-port="2" to-layer="3917" to-port="0" /> + <edge from-layer="3899" from-port="2" to-layer="3900" to-port="0" /> + <edge from-layer="3899" from-port="2" to-layer="3911" to-port="0" /> + <edge from-layer="3899" from-port="2" to-layer="3901" to-port="0" /> + <edge from-layer="3900" from-port="2" to-layer="3920" to-port="0" /> + <edge from-layer="3901" from-port="1" to-layer="3903" to-port="0" /> + <edge from-layer="3902" from-port="0" to-layer="3903" to-port="2" /> + <edge from-layer="3903" from-port="3" to-layer="3904" to-port="0" /> + <edge from-layer="3904" from-port="2" to-layer="3905" to-port="0" /> + <edge from-layer="3905" from-port="1" to-layer="3907" to-port="0" /> + <edge from-layer="3906" from-port="0" to-layer="3907" to-port="1" /> + <edge from-layer="3907" from-port="2" to-layer="3911" to-port="1" /> + <edge from-layer="3907" from-port="2" to-layer="3917" to-port="2" /> + <edge from-layer="3908" from-port="0" to-layer="3911" to-port="2" /> + <edge from-layer="3909" from-port="0" to-layer="3911" to-port="3" /> + <edge from-layer="3910" from-port="0" to-layer="3911" to-port="4" /> + <edge from-layer="3911" from-port="5" to-layer="3913" to-port="0" /> + <edge from-layer="3912" from-port="0" to-layer="3913" to-port="1" /> + <edge from-layer="3913" from-port="2" to-layer="3918" to-port="0" /> + <edge from-layer="3914" from-port="0" to-layer="3917" to-port="1" /> + <edge from-layer="3915" from-port="0" to-layer="3917" to-port="3" /> + <edge from-layer="3916" from-port="0" to-layer="3917" to-port="4" /> + <edge from-layer="3917" from-port="5" to-layer="3918" to-port="1" /> + <edge from-layer="3918" from-port="2" to-layer="3919" to-port="0" /> + <edge from-layer="3919" from-port="2" to-layer="3920" to-port="1" /> + <edge from-layer="3920" from-port="2" to-layer="4037" to-port="0" /> + <edge from-layer="3921" from-port="0" to-layer="3926" to-port="0" /> + <edge from-layer="3922" from-port="0" to-layer="3925" to-port="1" /> + <edge from-layer="3923" from-port="0" to-layer="3925" to-port="2" /> + <edge from-layer="3924" from-port="0" to-layer="3925" to-port="3" /> + <edge from-layer="3925" from-port="4" to-layer="3926" to-port="1" /> + <edge from-layer="3926" from-port="2" to-layer="3927" to-port="0" /> + <edge from-layer="3927" from-port="1" to-layer="3929" to-port="0" /> + <edge from-layer="3928" from-port="0" to-layer="3929" to-port="2" /> + <edge from-layer="3929" from-port="3" to-layer="3969" to-port="0" /> + <edge from-layer="3929" from-port="3" to-layer="4025" to-port="0" /> + <edge from-layer="3930" from-port="0" to-layer="3931" to-port="0" /> + <edge from-layer="3931" from-port="1" to-layer="3934" to-port="0" /> + <edge from-layer="3932" from-port="0" to-layer="3933" to-port="0" /> + <edge from-layer="3933" from-port="1" to-layer="3934" to-port="1" /> + <edge from-layer="3934" from-port="2" to-layer="3936" to-port="0" /> + <edge from-layer="3935" from-port="0" to-layer="3936" to-port="1" /> + <edge from-layer="3936" from-port="2" to-layer="3938" to-port="0" /> + <edge from-layer="3937" from-port="0" to-layer="3938" to-port="1" /> + <edge from-layer="3938" from-port="2" to-layer="3939" to-port="0" /> + <edge from-layer="3939" from-port="1" to-layer="3940" to-port="1" /> + <edge from-layer="3940" from-port="2" to-layer="3943" to-port="0" /> + <edge from-layer="3941" from-port="0" to-layer="3942" to-port="0" /> + <edge from-layer="3942" from-port="1" to-layer="3943" to-port="1" /> + <edge from-layer="3943" from-port="2" to-layer="3945" to-port="0" /> + <edge from-layer="3944" from-port="0" to-layer="3945" to-port="1" /> + <edge from-layer="3945" from-port="2" to-layer="3947" to-port="0" /> + <edge from-layer="3946" from-port="0" to-layer="3947" to-port="1" /> + <edge from-layer="3947" from-port="2" to-layer="3948" to-port="0" /> + <edge from-layer="3947" from-port="2" to-layer="3959" to-port="0" /> + <edge from-layer="3947" from-port="2" to-layer="3949" to-port="0" /> + <edge from-layer="3947" from-port="2" to-layer="3965" to-port="0" /> + <edge from-layer="3948" from-port="2" to-layer="3968" to-port="0" /> + <edge from-layer="3949" from-port="1" to-layer="3951" to-port="0" /> + <edge from-layer="3950" from-port="0" to-layer="3951" to-port="2" /> + <edge from-layer="3951" from-port="3" to-layer="3952" to-port="0" /> + <edge from-layer="3952" from-port="2" to-layer="3953" to-port="0" /> + <edge from-layer="3953" from-port="1" to-layer="3955" to-port="0" /> + <edge from-layer="3954" from-port="0" to-layer="3955" to-port="1" /> + <edge from-layer="3955" from-port="2" to-layer="3959" to-port="1" /> + <edge from-layer="3955" from-port="2" to-layer="3965" to-port="2" /> + <edge from-layer="3956" from-port="0" to-layer="3959" to-port="2" /> + <edge from-layer="3957" from-port="0" to-layer="3959" to-port="3" /> + <edge from-layer="3958" from-port="0" to-layer="3959" to-port="4" /> + <edge from-layer="3959" from-port="5" to-layer="3961" to-port="0" /> + <edge from-layer="3960" from-port="0" to-layer="3961" to-port="1" /> + <edge from-layer="3961" from-port="2" to-layer="3966" to-port="0" /> + <edge from-layer="3962" from-port="0" to-layer="3965" to-port="1" /> + <edge from-layer="3963" from-port="0" to-layer="3965" to-port="3" /> + <edge from-layer="3964" from-port="0" to-layer="3965" to-port="4" /> + <edge from-layer="3965" from-port="5" to-layer="3966" to-port="1" /> + <edge from-layer="3966" from-port="2" to-layer="3967" to-port="0" /> + <edge from-layer="3967" from-port="2" to-layer="3968" to-port="1" /> + <edge from-layer="3968" from-port="2" to-layer="3969" to-port="1" /> + <edge from-layer="3968" from-port="2" to-layer="4029" to-port="0" /> + <edge from-layer="3969" from-port="2" to-layer="11210" to-port="0" /> + <edge from-layer="3969" from-port="2" to-layer="3971" to-port="0" /> + <edge from-layer="3969" from-port="2" to-layer="3970" to-port="0" /> + <edge from-layer="3970" from-port="2" to-layer="3980" to-port="0" /> + <edge from-layer="3971" from-port="1" to-layer="3974" to-port="0" /> + <edge from-layer="3971" from-port="1" to-layer="3978" to-port="0" /> + <edge from-layer="3972" from-port="0" to-layer="3974" to-port="1" /> + <edge from-layer="3973" from-port="0" to-layer="3974" to-port="2" /> + <edge from-layer="3974" from-port="3" to-layer="3979" to-port="0" /> + <edge from-layer="3975" from-port="0" to-layer="3979" to-port="1" /> + <edge from-layer="3976" from-port="0" to-layer="3978" to-port="1" /> + <edge from-layer="3977" from-port="0" to-layer="3978" to-port="2" /> + <edge from-layer="3978" from-port="3" to-layer="3979" to-port="2" /> + <edge from-layer="3979" from-port="3" to-layer="3980" to-port="1" /> + <edge from-layer="3980" from-port="2" to-layer="3982" to-port="0" /> + <edge from-layer="3981" from-port="0" to-layer="3982" to-port="1" /> + <edge from-layer="3982" from-port="2" to-layer="4037" to-port="1" /> + <edge from-layer="3983" from-port="0" to-layer="3988" to-port="0" /> + <edge from-layer="3984" from-port="0" to-layer="3987" to-port="1" /> + <edge from-layer="3985" from-port="0" to-layer="3987" to-port="2" /> + <edge from-layer="3986" from-port="0" to-layer="3987" to-port="3" /> + <edge from-layer="3987" from-port="4" to-layer="3988" to-port="1" /> + <edge from-layer="3988" from-port="2" to-layer="3989" to-port="0" /> + <edge from-layer="3989" from-port="1" to-layer="3991" to-port="0" /> + <edge from-layer="3990" from-port="0" to-layer="3991" to-port="2" /> + <edge from-layer="3991" from-port="3" to-layer="4010" to-port="0" /> + <edge from-layer="3992" from-port="0" to-layer="3993" to-port="0" /> + <edge from-layer="3993" from-port="1" to-layer="3996" to-port="0" /> + <edge from-layer="3994" from-port="0" to-layer="3995" to-port="0" /> + <edge from-layer="3995" from-port="1" to-layer="3996" to-port="1" /> + <edge from-layer="3996" from-port="2" to-layer="3998" to-port="0" /> + <edge from-layer="3997" from-port="0" to-layer="3998" to-port="1" /> + <edge from-layer="3998" from-port="2" to-layer="4000" to-port="0" /> + <edge from-layer="3999" from-port="0" to-layer="4000" to-port="1" /> + <edge from-layer="4000" from-port="2" to-layer="4001" to-port="0" /> + <edge from-layer="4001" from-port="1" to-layer="4002" to-port="1" /> + <edge from-layer="4002" from-port="2" to-layer="4005" to-port="0" /> + <edge from-layer="4003" from-port="0" to-layer="4004" to-port="0" /> + <edge from-layer="4004" from-port="1" to-layer="4005" to-port="1" /> + <edge from-layer="4005" from-port="2" to-layer="4007" to-port="0" /> + <edge from-layer="4006" from-port="0" to-layer="4007" to-port="1" /> + <edge from-layer="4007" from-port="2" to-layer="4009" to-port="0" /> + <edge from-layer="4008" from-port="0" to-layer="4009" to-port="1" /> + <edge from-layer="4009" from-port="2" to-layer="4010" to-port="1" /> + <edge from-layer="4010" from-port="2" to-layer="4012" to-port="0" /> + <edge from-layer="4010" from-port="2" to-layer="4011" to-port="0" /> + <edge from-layer="4010" from-port="2" to-layer="11209" to-port="0" /> + <edge from-layer="4011" from-port="2" to-layer="4021" to-port="0" /> + <edge from-layer="4012" from-port="1" to-layer="4015" to-port="0" /> + <edge from-layer="4012" from-port="1" to-layer="4019" to-port="0" /> + <edge from-layer="4013" from-port="0" to-layer="4015" to-port="1" /> + <edge from-layer="4014" from-port="0" to-layer="4015" to-port="2" /> + <edge from-layer="4015" from-port="3" to-layer="4020" to-port="1" /> + <edge from-layer="4016" from-port="0" to-layer="4020" to-port="2" /> + <edge from-layer="4017" from-port="0" to-layer="4019" to-port="1" /> + <edge from-layer="4018" from-port="0" to-layer="4019" to-port="2" /> + <edge from-layer="4019" from-port="3" to-layer="4020" to-port="3" /> + <edge from-layer="4020" from-port="4" to-layer="4021" to-port="1" /> + <edge from-layer="4021" from-port="2" to-layer="4023" to-port="0" /> + <edge from-layer="4022" from-port="0" to-layer="4023" to-port="1" /> + <edge from-layer="4023" from-port="2" to-layer="4037" to-port="2" /> + <edge from-layer="4024" from-port="0" to-layer="4036" to-port="1" /> + <edge from-layer="4025" from-port="1" to-layer="4028" to-port="0" /> + <edge from-layer="4026" from-port="0" to-layer="4028" to-port="1" /> + <edge from-layer="4027" from-port="0" to-layer="4028" to-port="2" /> + <edge from-layer="4028" from-port="3" to-layer="4033" to-port="0" /> + <edge from-layer="4029" from-port="1" to-layer="4032" to-port="0" /> + <edge from-layer="4030" from-port="0" to-layer="4032" to-port="1" /> + <edge from-layer="4031" from-port="0" to-layer="4032" to-port="2" /> + <edge from-layer="4032" from-port="3" to-layer="4033" to-port="1" /> + <edge from-layer="4033" from-port="2" to-layer="4036" to-port="2" /> + <edge from-layer="4034" from-port="0" to-layer="4036" to-port="3" /> + <edge from-layer="4035" from-port="0" to-layer="4036" to-port="4" /> + <edge from-layer="4036" from-port="5" to-layer="4037" to-port="3" /> + <edge from-layer="4037" from-port="4" to-layer="4039" to-port="0" /> + <edge from-layer="4038" from-port="0" to-layer="4039" to-port="1" /> + <edge from-layer="4039" from-port="2" to-layer="4041" to-port="0" /> + <edge from-layer="4040" from-port="0" to-layer="4041" to-port="1" /> + <edge from-layer="4041" from-port="2" to-layer="4052" to-port="0" /> + <edge from-layer="4042" from-port="0" to-layer="4043" to-port="0" /> + <edge from-layer="4043" from-port="1" to-layer="4046" to-port="0" /> + <edge from-layer="4044" from-port="0" to-layer="4045" to-port="0" /> + <edge from-layer="4045" from-port="1" to-layer="4046" to-port="1" /> + <edge from-layer="4046" from-port="2" to-layer="4048" to-port="0" /> + <edge from-layer="4047" from-port="0" to-layer="4048" to-port="1" /> + <edge from-layer="4048" from-port="2" to-layer="4050" to-port="0" /> + <edge from-layer="4049" from-port="0" to-layer="4050" to-port="1" /> + <edge from-layer="4050" from-port="2" to-layer="4051" to-port="0" /> + <edge from-layer="4051" from-port="1" to-layer="4052" to-port="1" /> + <edge from-layer="4052" from-port="2" to-layer="4053" to-port="1" /> + <edge from-layer="4053" from-port="2" to-layer="4101" to-port="0" /> + <edge from-layer="4053" from-port="2" to-layer="4064" to-port="0" /> + <edge from-layer="4053" from-port="2" to-layer="4057" to-port="0" /> + <edge from-layer="4054" from-port="0" to-layer="4065" to-port="0" /> + <edge from-layer="4055" from-port="0" to-layer="4063" to-port="0" /> + <edge from-layer="4056" from-port="0" to-layer="4057" to-port="1" /> + <edge from-layer="4057" from-port="2" to-layer="4059" to-port="0" /> + <edge from-layer="4058" from-port="0" to-layer="4059" to-port="1" /> + <edge from-layer="4059" from-port="2" to-layer="4061" to-port="0" /> + <edge from-layer="4060" from-port="0" to-layer="4061" to-port="1" /> + <edge from-layer="4061" from-port="2" to-layer="4062" to-port="0" /> + <edge from-layer="4062" from-port="1" to-layer="4063" to-port="1" /> + <edge from-layer="4063" from-port="2" to-layer="4064" to-port="1" /> + <edge from-layer="4064" from-port="2" to-layer="4065" to-port="1" /> + <edge from-layer="4065" from-port="2" to-layer="4088" to-port="0" /> + <edge from-layer="4065" from-port="2" to-layer="4076" to-port="0" /> + <edge from-layer="4066" from-port="0" to-layer="4067" to-port="0" /> + <edge from-layer="4067" from-port="1" to-layer="4070" to-port="0" /> + <edge from-layer="4068" from-port="0" to-layer="4069" to-port="0" /> + <edge from-layer="4069" from-port="1" to-layer="4070" to-port="1" /> + <edge from-layer="4070" from-port="2" to-layer="4072" to-port="0" /> + <edge from-layer="4071" from-port="0" to-layer="4072" to-port="1" /> + <edge from-layer="4072" from-port="2" to-layer="4074" to-port="0" /> + <edge from-layer="4073" from-port="0" to-layer="4074" to-port="1" /> + <edge from-layer="4074" from-port="2" to-layer="4075" to-port="0" /> + <edge from-layer="4075" from-port="1" to-layer="4076" to-port="1" /> + <edge from-layer="4076" from-port="2" to-layer="4077" to-port="0" /> + <edge from-layer="4077" from-port="1" to-layer="4089" to-port="0" /> + <edge from-layer="4078" from-port="0" to-layer="4079" to-port="0" /> + <edge from-layer="4079" from-port="1" to-layer="4082" to-port="0" /> + <edge from-layer="4080" from-port="0" to-layer="4081" to-port="0" /> + <edge from-layer="4081" from-port="1" to-layer="4082" to-port="1" /> + <edge from-layer="4082" from-port="2" to-layer="4084" to-port="0" /> + <edge from-layer="4083" from-port="0" to-layer="4084" to-port="1" /> + <edge from-layer="4084" from-port="2" to-layer="4086" to-port="0" /> + <edge from-layer="4085" from-port="0" to-layer="4086" to-port="1" /> + <edge from-layer="4086" from-port="2" to-layer="4087" to-port="0" /> + <edge from-layer="4087" from-port="1" to-layer="4088" to-port="1" /> + <edge from-layer="4088" from-port="2" to-layer="4089" to-port="1" /> + <edge from-layer="4089" from-port="2" to-layer="4100" to-port="0" /> + <edge from-layer="4090" from-port="0" to-layer="4091" to-port="0" /> + <edge from-layer="4091" from-port="1" to-layer="4094" to-port="0" /> + <edge from-layer="4092" from-port="0" to-layer="4093" to-port="0" /> + <edge from-layer="4093" from-port="1" to-layer="4094" to-port="1" /> + <edge from-layer="4094" from-port="2" to-layer="4096" to-port="0" /> + <edge from-layer="4095" from-port="0" to-layer="4096" to-port="1" /> + <edge from-layer="4096" from-port="2" to-layer="4098" to-port="0" /> + <edge from-layer="4097" from-port="0" to-layer="4098" to-port="1" /> + <edge from-layer="4098" from-port="2" to-layer="4099" to-port="0" /> + <edge from-layer="4099" from-port="1" to-layer="4100" to-port="1" /> + <edge from-layer="4100" from-port="2" to-layer="4101" to-port="1" /> + <edge from-layer="4101" from-port="2" to-layer="4105" to-port="0" /> + <edge from-layer="4101" from-port="2" to-layer="4285" to-port="0" /> + <edge from-layer="4101" from-port="2" to-layer="4112" to-port="0" /> + <edge from-layer="4102" from-port="0" to-layer="4113" to-port="0" /> + <edge from-layer="4103" from-port="0" to-layer="4111" to-port="0" /> + <edge from-layer="4104" from-port="0" to-layer="4105" to-port="1" /> + <edge from-layer="4105" from-port="2" to-layer="4107" to-port="0" /> + <edge from-layer="4106" from-port="0" to-layer="4107" to-port="1" /> + <edge from-layer="4107" from-port="2" to-layer="4109" to-port="0" /> + <edge from-layer="4108" from-port="0" to-layer="4109" to-port="1" /> + <edge from-layer="4109" from-port="2" to-layer="4110" to-port="0" /> + <edge from-layer="4110" from-port="1" to-layer="4111" to-port="1" /> + <edge from-layer="4111" from-port="2" to-layer="4112" to-port="1" /> + <edge from-layer="4112" from-port="2" to-layer="4113" to-port="1" /> + <edge from-layer="4113" from-port="2" to-layer="4234" to-port="0" /> + <edge from-layer="4113" from-port="2" to-layer="4124" to-port="0" /> + <edge from-layer="4113" from-port="2" to-layer="4172" to-port="0" /> + <edge from-layer="4114" from-port="0" to-layer="4115" to-port="0" /> + <edge from-layer="4115" from-port="1" to-layer="4118" to-port="0" /> + <edge from-layer="4116" from-port="0" to-layer="4117" to-port="0" /> + <edge from-layer="4117" from-port="1" to-layer="4118" to-port="1" /> + <edge from-layer="4118" from-port="2" to-layer="4120" to-port="0" /> + <edge from-layer="4119" from-port="0" to-layer="4120" to-port="1" /> + <edge from-layer="4120" from-port="2" to-layer="4122" to-port="0" /> + <edge from-layer="4121" from-port="0" to-layer="4122" to-port="1" /> + <edge from-layer="4122" from-port="2" to-layer="4123" to-port="0" /> + <edge from-layer="4123" from-port="1" to-layer="4124" to-port="1" /> + <edge from-layer="4124" from-port="2" to-layer="4127" to-port="0" /> + <edge from-layer="4125" from-port="0" to-layer="4126" to-port="0" /> + <edge from-layer="4126" from-port="1" to-layer="4127" to-port="1" /> + <edge from-layer="4127" from-port="2" to-layer="4129" to-port="0" /> + <edge from-layer="4128" from-port="0" to-layer="4129" to-port="1" /> + <edge from-layer="4129" from-port="2" to-layer="4131" to-port="0" /> + <edge from-layer="4130" from-port="0" to-layer="4131" to-port="1" /> + <edge from-layer="4131" from-port="2" to-layer="4132" to-port="0" /> + <edge from-layer="4131" from-port="2" to-layer="4133" to-port="0" /> + <edge from-layer="4131" from-port="2" to-layer="4149" to-port="0" /> + <edge from-layer="4131" from-port="2" to-layer="4143" to-port="0" /> + <edge from-layer="4132" from-port="2" to-layer="4152" to-port="0" /> + <edge from-layer="4133" from-port="1" to-layer="4135" to-port="0" /> + <edge from-layer="4134" from-port="0" to-layer="4135" to-port="2" /> + <edge from-layer="4135" from-port="3" to-layer="4136" to-port="0" /> + <edge from-layer="4136" from-port="2" to-layer="4137" to-port="0" /> + <edge from-layer="4137" from-port="1" to-layer="4139" to-port="0" /> + <edge from-layer="4138" from-port="0" to-layer="4139" to-port="1" /> + <edge from-layer="4139" from-port="2" to-layer="4149" to-port="2" /> + <edge from-layer="4139" from-port="2" to-layer="4143" to-port="1" /> + <edge from-layer="4140" from-port="0" to-layer="4143" to-port="2" /> + <edge from-layer="4141" from-port="0" to-layer="4143" to-port="3" /> + <edge from-layer="4142" from-port="0" to-layer="4143" to-port="4" /> + <edge from-layer="4143" from-port="5" to-layer="4145" to-port="0" /> + <edge from-layer="4144" from-port="0" to-layer="4145" to-port="1" /> + <edge from-layer="4145" from-port="2" to-layer="4150" to-port="0" /> + <edge from-layer="4146" from-port="0" to-layer="4149" to-port="1" /> + <edge from-layer="4147" from-port="0" to-layer="4149" to-port="3" /> + <edge from-layer="4148" from-port="0" to-layer="4149" to-port="4" /> + <edge from-layer="4149" from-port="5" to-layer="4150" to-port="1" /> + <edge from-layer="4150" from-port="2" to-layer="4151" to-port="0" /> + <edge from-layer="4151" from-port="2" to-layer="4152" to-port="1" /> + <edge from-layer="4152" from-port="2" to-layer="4269" to-port="0" /> + <edge from-layer="4153" from-port="0" to-layer="4158" to-port="0" /> + <edge from-layer="4154" from-port="0" to-layer="4157" to-port="1" /> + <edge from-layer="4155" from-port="0" to-layer="4157" to-port="2" /> + <edge from-layer="4156" from-port="0" to-layer="4157" to-port="3" /> + <edge from-layer="4157" from-port="4" to-layer="4158" to-port="1" /> + <edge from-layer="4158" from-port="2" to-layer="4159" to-port="0" /> + <edge from-layer="4159" from-port="1" to-layer="4161" to-port="0" /> + <edge from-layer="4160" from-port="0" to-layer="4161" to-port="2" /> + <edge from-layer="4161" from-port="3" to-layer="4201" to-port="0" /> + <edge from-layer="4161" from-port="3" to-layer="4257" to-port="0" /> + <edge from-layer="4162" from-port="0" to-layer="4163" to-port="0" /> + <edge from-layer="4163" from-port="1" to-layer="4166" to-port="0" /> + <edge from-layer="4164" from-port="0" to-layer="4165" to-port="0" /> + <edge from-layer="4165" from-port="1" to-layer="4166" to-port="1" /> + <edge from-layer="4166" from-port="2" to-layer="4168" to-port="0" /> + <edge from-layer="4167" from-port="0" to-layer="4168" to-port="1" /> + <edge from-layer="4168" from-port="2" to-layer="4170" to-port="0" /> + <edge from-layer="4169" from-port="0" to-layer="4170" to-port="1" /> + <edge from-layer="4170" from-port="2" to-layer="4171" to-port="0" /> + <edge from-layer="4171" from-port="1" to-layer="4172" to-port="1" /> + <edge from-layer="4172" from-port="2" to-layer="4175" to-port="0" /> + <edge from-layer="4173" from-port="0" to-layer="4174" to-port="0" /> + <edge from-layer="4174" from-port="1" to-layer="4175" to-port="1" /> + <edge from-layer="4175" from-port="2" to-layer="4177" to-port="0" /> + <edge from-layer="4176" from-port="0" to-layer="4177" to-port="1" /> + <edge from-layer="4177" from-port="2" to-layer="4179" to-port="0" /> + <edge from-layer="4178" from-port="0" to-layer="4179" to-port="1" /> + <edge from-layer="4179" from-port="2" to-layer="4197" to-port="0" /> + <edge from-layer="4179" from-port="2" to-layer="4191" to-port="0" /> + <edge from-layer="4179" from-port="2" to-layer="4181" to-port="0" /> + <edge from-layer="4179" from-port="2" to-layer="4180" to-port="0" /> + <edge from-layer="4180" from-port="2" to-layer="4200" to-port="0" /> + <edge from-layer="4181" from-port="1" to-layer="4183" to-port="0" /> + <edge from-layer="4182" from-port="0" to-layer="4183" to-port="2" /> + <edge from-layer="4183" from-port="3" to-layer="4184" to-port="0" /> + <edge from-layer="4184" from-port="2" to-layer="4185" to-port="0" /> + <edge from-layer="4185" from-port="1" to-layer="4187" to-port="0" /> + <edge from-layer="4186" from-port="0" to-layer="4187" to-port="1" /> + <edge from-layer="4187" from-port="2" to-layer="4197" to-port="2" /> + <edge from-layer="4187" from-port="2" to-layer="4191" to-port="1" /> + <edge from-layer="4188" from-port="0" to-layer="4191" to-port="2" /> + <edge from-layer="4189" from-port="0" to-layer="4191" to-port="3" /> + <edge from-layer="4190" from-port="0" to-layer="4191" to-port="4" /> + <edge from-layer="4191" from-port="5" to-layer="4193" to-port="0" /> + <edge from-layer="4192" from-port="0" to-layer="4193" to-port="1" /> + <edge from-layer="4193" from-port="2" to-layer="4198" to-port="0" /> + <edge from-layer="4194" from-port="0" to-layer="4197" to-port="1" /> + <edge from-layer="4195" from-port="0" to-layer="4197" to-port="3" /> + <edge from-layer="4196" from-port="0" to-layer="4197" to-port="4" /> + <edge from-layer="4197" from-port="5" to-layer="4198" to-port="1" /> + <edge from-layer="4198" from-port="2" to-layer="4199" to-port="0" /> + <edge from-layer="4199" from-port="2" to-layer="4200" to-port="1" /> + <edge from-layer="4200" from-port="2" to-layer="4201" to-port="1" /> + <edge from-layer="4200" from-port="2" to-layer="4261" to-port="0" /> + <edge from-layer="4201" from-port="2" to-layer="4202" to-port="0" /> + <edge from-layer="4201" from-port="2" to-layer="4203" to-port="0" /> + <edge from-layer="4201" from-port="2" to-layer="11208" to-port="0" /> + <edge from-layer="4202" from-port="2" to-layer="4212" to-port="0" /> + <edge from-layer="4203" from-port="1" to-layer="4206" to-port="0" /> + <edge from-layer="4203" from-port="1" to-layer="4210" to-port="0" /> + <edge from-layer="4204" from-port="0" to-layer="4206" to-port="1" /> + <edge from-layer="4205" from-port="0" to-layer="4206" to-port="2" /> + <edge from-layer="4206" from-port="3" to-layer="4211" to-port="0" /> + <edge from-layer="4207" from-port="0" to-layer="4211" to-port="1" /> + <edge from-layer="4208" from-port="0" to-layer="4210" to-port="1" /> + <edge from-layer="4209" from-port="0" to-layer="4210" to-port="2" /> + <edge from-layer="4210" from-port="3" to-layer="4211" to-port="2" /> + <edge from-layer="4211" from-port="3" to-layer="4212" to-port="1" /> + <edge from-layer="4212" from-port="2" to-layer="4214" to-port="0" /> + <edge from-layer="4213" from-port="0" to-layer="4214" to-port="1" /> + <edge from-layer="4214" from-port="2" to-layer="4269" to-port="1" /> + <edge from-layer="4215" from-port="0" to-layer="4220" to-port="0" /> + <edge from-layer="4216" from-port="0" to-layer="4219" to-port="1" /> + <edge from-layer="4217" from-port="0" to-layer="4219" to-port="2" /> + <edge from-layer="4218" from-port="0" to-layer="4219" to-port="3" /> + <edge from-layer="4219" from-port="4" to-layer="4220" to-port="1" /> + <edge from-layer="4220" from-port="2" to-layer="4221" to-port="0" /> + <edge from-layer="4221" from-port="1" to-layer="4223" to-port="0" /> + <edge from-layer="4222" from-port="0" to-layer="4223" to-port="2" /> + <edge from-layer="4223" from-port="3" to-layer="4242" to-port="0" /> + <edge from-layer="4224" from-port="0" to-layer="4225" to-port="0" /> + <edge from-layer="4225" from-port="1" to-layer="4228" to-port="0" /> + <edge from-layer="4226" from-port="0" to-layer="4227" to-port="0" /> + <edge from-layer="4227" from-port="1" to-layer="4228" to-port="1" /> + <edge from-layer="4228" from-port="2" to-layer="4230" to-port="0" /> + <edge from-layer="4229" from-port="0" to-layer="4230" to-port="1" /> + <edge from-layer="4230" from-port="2" to-layer="4232" to-port="0" /> + <edge from-layer="4231" from-port="0" to-layer="4232" to-port="1" /> + <edge from-layer="4232" from-port="2" to-layer="4233" to-port="0" /> + <edge from-layer="4233" from-port="1" to-layer="4234" to-port="1" /> + <edge from-layer="4234" from-port="2" to-layer="4237" to-port="0" /> + <edge from-layer="4235" from-port="0" to-layer="4236" to-port="0" /> + <edge from-layer="4236" from-port="1" to-layer="4237" to-port="1" /> + <edge from-layer="4237" from-port="2" to-layer="4239" to-port="0" /> + <edge from-layer="4238" from-port="0" to-layer="4239" to-port="1" /> + <edge from-layer="4239" from-port="2" to-layer="4241" to-port="0" /> + <edge from-layer="4240" from-port="0" to-layer="4241" to-port="1" /> + <edge from-layer="4241" from-port="2" to-layer="4242" to-port="1" /> + <edge from-layer="4242" from-port="2" to-layer="11207" to-port="0" /> + <edge from-layer="4242" from-port="2" to-layer="4243" to-port="0" /> + <edge from-layer="4242" from-port="2" to-layer="4244" to-port="0" /> + <edge from-layer="4243" from-port="2" to-layer="4253" to-port="0" /> + <edge from-layer="4244" from-port="1" to-layer="4251" to-port="0" /> + <edge from-layer="4244" from-port="1" to-layer="4247" to-port="0" /> + <edge from-layer="4245" from-port="0" to-layer="4247" to-port="1" /> + <edge from-layer="4246" from-port="0" to-layer="4247" to-port="2" /> + <edge from-layer="4247" from-port="3" to-layer="4252" to-port="1" /> + <edge from-layer="4248" from-port="0" to-layer="4252" to-port="2" /> + <edge from-layer="4249" from-port="0" to-layer="4251" to-port="1" /> + <edge from-layer="4250" from-port="0" to-layer="4251" to-port="2" /> + <edge from-layer="4251" from-port="3" to-layer="4252" to-port="3" /> + <edge from-layer="4252" from-port="4" to-layer="4253" to-port="1" /> + <edge from-layer="4253" from-port="2" to-layer="4255" to-port="0" /> + <edge from-layer="4254" from-port="0" to-layer="4255" to-port="1" /> + <edge from-layer="4255" from-port="2" to-layer="4269" to-port="2" /> + <edge from-layer="4256" from-port="0" to-layer="4268" to-port="1" /> + <edge from-layer="4257" from-port="1" to-layer="4260" to-port="0" /> + <edge from-layer="4258" from-port="0" to-layer="4260" to-port="1" /> + <edge from-layer="4259" from-port="0" to-layer="4260" to-port="2" /> + <edge from-layer="4260" from-port="3" to-layer="4265" to-port="0" /> + <edge from-layer="4261" from-port="1" to-layer="4264" to-port="0" /> + <edge from-layer="4262" from-port="0" to-layer="4264" to-port="1" /> + <edge from-layer="4263" from-port="0" to-layer="4264" to-port="2" /> + <edge from-layer="4264" from-port="3" to-layer="4265" to-port="1" /> + <edge from-layer="4265" from-port="2" to-layer="4268" to-port="2" /> + <edge from-layer="4266" from-port="0" to-layer="4268" to-port="3" /> + <edge from-layer="4267" from-port="0" to-layer="4268" to-port="4" /> + <edge from-layer="4268" from-port="5" to-layer="4269" to-port="3" /> + <edge from-layer="4269" from-port="4" to-layer="4271" to-port="0" /> + <edge from-layer="4270" from-port="0" to-layer="4271" to-port="1" /> + <edge from-layer="4271" from-port="2" to-layer="4273" to-port="0" /> + <edge from-layer="4272" from-port="0" to-layer="4273" to-port="1" /> + <edge from-layer="4273" from-port="2" to-layer="4284" to-port="0" /> + <edge from-layer="4274" from-port="0" to-layer="4275" to-port="0" /> + <edge from-layer="4275" from-port="1" to-layer="4278" to-port="0" /> + <edge from-layer="4276" from-port="0" to-layer="4277" to-port="0" /> + <edge from-layer="4277" from-port="1" to-layer="4278" to-port="1" /> + <edge from-layer="4278" from-port="2" to-layer="4280" to-port="0" /> + <edge from-layer="4279" from-port="0" to-layer="4280" to-port="1" /> + <edge from-layer="4280" from-port="2" to-layer="4282" to-port="0" /> + <edge from-layer="4281" from-port="0" to-layer="4282" to-port="1" /> + <edge from-layer="4282" from-port="2" to-layer="4283" to-port="0" /> + <edge from-layer="4283" from-port="1" to-layer="4284" to-port="1" /> + <edge from-layer="4284" from-port="2" to-layer="4285" to-port="1" /> + <edge from-layer="4285" from-port="2" to-layer="4296" to-port="0" /> + <edge from-layer="4285" from-port="2" to-layer="4333" to-port="0" /> + <edge from-layer="4285" from-port="2" to-layer="4289" to-port="0" /> + <edge from-layer="4286" from-port="0" to-layer="4297" to-port="0" /> + <edge from-layer="4287" from-port="0" to-layer="4295" to-port="0" /> + <edge from-layer="4288" from-port="0" to-layer="4289" to-port="1" /> + <edge from-layer="4289" from-port="2" to-layer="4291" to-port="0" /> + <edge from-layer="4290" from-port="0" to-layer="4291" to-port="1" /> + <edge from-layer="4291" from-port="2" to-layer="4293" to-port="0" /> + <edge from-layer="4292" from-port="0" to-layer="4293" to-port="1" /> + <edge from-layer="4293" from-port="2" to-layer="4294" to-port="0" /> + <edge from-layer="4294" from-port="1" to-layer="4295" to-port="1" /> + <edge from-layer="4295" from-port="2" to-layer="4296" to-port="1" /> + <edge from-layer="4296" from-port="2" to-layer="4297" to-port="1" /> + <edge from-layer="4297" from-port="2" to-layer="4320" to-port="0" /> + <edge from-layer="4297" from-port="2" to-layer="4308" to-port="0" /> + <edge from-layer="4298" from-port="0" to-layer="4299" to-port="0" /> + <edge from-layer="4299" from-port="1" to-layer="4302" to-port="0" /> + <edge from-layer="4300" from-port="0" to-layer="4301" to-port="0" /> + <edge from-layer="4301" from-port="1" to-layer="4302" to-port="1" /> + <edge from-layer="4302" from-port="2" to-layer="4304" to-port="0" /> + <edge from-layer="4303" from-port="0" to-layer="4304" to-port="1" /> + <edge from-layer="4304" from-port="2" to-layer="4306" to-port="0" /> + <edge from-layer="4305" from-port="0" to-layer="4306" to-port="1" /> + <edge from-layer="4306" from-port="2" to-layer="4307" to-port="0" /> + <edge from-layer="4307" from-port="1" to-layer="4308" to-port="1" /> + <edge from-layer="4308" from-port="2" to-layer="4309" to-port="0" /> + <edge from-layer="4309" from-port="1" to-layer="4321" to-port="0" /> + <edge from-layer="4310" from-port="0" to-layer="4311" to-port="0" /> + <edge from-layer="4311" from-port="1" to-layer="4314" to-port="0" /> + <edge from-layer="4312" from-port="0" to-layer="4313" to-port="0" /> + <edge from-layer="4313" from-port="1" to-layer="4314" to-port="1" /> + <edge from-layer="4314" from-port="2" to-layer="4316" to-port="0" /> + <edge from-layer="4315" from-port="0" to-layer="4316" to-port="1" /> + <edge from-layer="4316" from-port="2" to-layer="4318" to-port="0" /> + <edge from-layer="4317" from-port="0" to-layer="4318" to-port="1" /> + <edge from-layer="4318" from-port="2" to-layer="4319" to-port="0" /> + <edge from-layer="4319" from-port="1" to-layer="4320" to-port="1" /> + <edge from-layer="4320" from-port="2" to-layer="4321" to-port="1" /> + <edge from-layer="4321" from-port="2" to-layer="4332" to-port="0" /> + <edge from-layer="4322" from-port="0" to-layer="4323" to-port="0" /> + <edge from-layer="4323" from-port="1" to-layer="4326" to-port="0" /> + <edge from-layer="4324" from-port="0" to-layer="4325" to-port="0" /> + <edge from-layer="4325" from-port="1" to-layer="4326" to-port="1" /> + <edge from-layer="4326" from-port="2" to-layer="4328" to-port="0" /> + <edge from-layer="4327" from-port="0" to-layer="4328" to-port="1" /> + <edge from-layer="4328" from-port="2" to-layer="4330" to-port="0" /> + <edge from-layer="4329" from-port="0" to-layer="4330" to-port="1" /> + <edge from-layer="4330" from-port="2" to-layer="4331" to-port="0" /> + <edge from-layer="4331" from-port="1" to-layer="4332" to-port="1" /> + <edge from-layer="4332" from-port="2" to-layer="4333" to-port="1" /> + <edge from-layer="4333" from-port="2" to-layer="4337" to-port="0" /> + <edge from-layer="4333" from-port="2" to-layer="4344" to-port="0" /> + <edge from-layer="4333" from-port="2" to-layer="4517" to-port="0" /> + <edge from-layer="4334" from-port="0" to-layer="4345" to-port="0" /> + <edge from-layer="4335" from-port="0" to-layer="4343" to-port="0" /> + <edge from-layer="4336" from-port="0" to-layer="4337" to-port="1" /> + <edge from-layer="4337" from-port="2" to-layer="4339" to-port="0" /> + <edge from-layer="4338" from-port="0" to-layer="4339" to-port="1" /> + <edge from-layer="4339" from-port="2" to-layer="4341" to-port="0" /> + <edge from-layer="4340" from-port="0" to-layer="4341" to-port="1" /> + <edge from-layer="4341" from-port="2" to-layer="4342" to-port="0" /> + <edge from-layer="4342" from-port="1" to-layer="4343" to-port="1" /> + <edge from-layer="4343" from-port="2" to-layer="4344" to-port="1" /> + <edge from-layer="4344" from-port="2" to-layer="4345" to-port="1" /> + <edge from-layer="4345" from-port="2" to-layer="4356" to-port="0" /> + <edge from-layer="4345" from-port="2" to-layer="4466" to-port="0" /> + <edge from-layer="4345" from-port="2" to-layer="4404" to-port="0" /> + <edge from-layer="4346" from-port="0" to-layer="4347" to-port="0" /> + <edge from-layer="4347" from-port="1" to-layer="4350" to-port="0" /> + <edge from-layer="4348" from-port="0" to-layer="4349" to-port="0" /> + <edge from-layer="4349" from-port="1" to-layer="4350" to-port="1" /> + <edge from-layer="4350" from-port="2" to-layer="4352" to-port="0" /> + <edge from-layer="4351" from-port="0" to-layer="4352" to-port="1" /> + <edge from-layer="4352" from-port="2" to-layer="4354" to-port="0" /> + <edge from-layer="4353" from-port="0" to-layer="4354" to-port="1" /> + <edge from-layer="4354" from-port="2" to-layer="4355" to-port="0" /> + <edge from-layer="4355" from-port="1" to-layer="4356" to-port="1" /> + <edge from-layer="4356" from-port="2" to-layer="4359" to-port="0" /> + <edge from-layer="4357" from-port="0" to-layer="4358" to-port="0" /> + <edge from-layer="4358" from-port="1" to-layer="4359" to-port="1" /> + <edge from-layer="4359" from-port="2" to-layer="4361" to-port="0" /> + <edge from-layer="4360" from-port="0" to-layer="4361" to-port="1" /> + <edge from-layer="4361" from-port="2" to-layer="4363" to-port="0" /> + <edge from-layer="4362" from-port="0" to-layer="4363" to-port="1" /> + <edge from-layer="4363" from-port="2" to-layer="4375" to-port="0" /> + <edge from-layer="4363" from-port="2" to-layer="4381" to-port="0" /> + <edge from-layer="4363" from-port="2" to-layer="4364" to-port="0" /> + <edge from-layer="4363" from-port="2" to-layer="4365" to-port="0" /> + <edge from-layer="4364" from-port="2" to-layer="4384" to-port="0" /> + <edge from-layer="4365" from-port="1" to-layer="4367" to-port="0" /> + <edge from-layer="4366" from-port="0" to-layer="4367" to-port="2" /> + <edge from-layer="4367" from-port="3" to-layer="4368" to-port="0" /> + <edge from-layer="4368" from-port="2" to-layer="4369" to-port="0" /> + <edge from-layer="4369" from-port="1" to-layer="4371" to-port="0" /> + <edge from-layer="4370" from-port="0" to-layer="4371" to-port="1" /> + <edge from-layer="4371" from-port="2" to-layer="4381" to-port="2" /> + <edge from-layer="4371" from-port="2" to-layer="4375" to-port="1" /> + <edge from-layer="4372" from-port="0" to-layer="4375" to-port="2" /> + <edge from-layer="4373" from-port="0" to-layer="4375" to-port="3" /> + <edge from-layer="4374" from-port="0" to-layer="4375" to-port="4" /> + <edge from-layer="4375" from-port="5" to-layer="4377" to-port="0" /> + <edge from-layer="4376" from-port="0" to-layer="4377" to-port="1" /> + <edge from-layer="4377" from-port="2" to-layer="4382" to-port="0" /> + <edge from-layer="4378" from-port="0" to-layer="4381" to-port="1" /> + <edge from-layer="4379" from-port="0" to-layer="4381" to-port="3" /> + <edge from-layer="4380" from-port="0" to-layer="4381" to-port="4" /> + <edge from-layer="4381" from-port="5" to-layer="4382" to-port="1" /> + <edge from-layer="4382" from-port="2" to-layer="4383" to-port="0" /> + <edge from-layer="4383" from-port="2" to-layer="4384" to-port="1" /> + <edge from-layer="4384" from-port="2" to-layer="4501" to-port="0" /> + <edge from-layer="4385" from-port="0" to-layer="4390" to-port="0" /> + <edge from-layer="4386" from-port="0" to-layer="4389" to-port="1" /> + <edge from-layer="4387" from-port="0" to-layer="4389" to-port="2" /> + <edge from-layer="4388" from-port="0" to-layer="4389" to-port="3" /> + <edge from-layer="4389" from-port="4" to-layer="4390" to-port="1" /> + <edge from-layer="4390" from-port="2" to-layer="4391" to-port="0" /> + <edge from-layer="4391" from-port="1" to-layer="4393" to-port="0" /> + <edge from-layer="4392" from-port="0" to-layer="4393" to-port="2" /> + <edge from-layer="4393" from-port="3" to-layer="4489" to-port="0" /> + <edge from-layer="4393" from-port="3" to-layer="4433" to-port="0" /> + <edge from-layer="4394" from-port="0" to-layer="4395" to-port="0" /> + <edge from-layer="4395" from-port="1" to-layer="4398" to-port="0" /> + <edge from-layer="4396" from-port="0" to-layer="4397" to-port="0" /> + <edge from-layer="4397" from-port="1" to-layer="4398" to-port="1" /> + <edge from-layer="4398" from-port="2" to-layer="4400" to-port="0" /> + <edge from-layer="4399" from-port="0" to-layer="4400" to-port="1" /> + <edge from-layer="4400" from-port="2" to-layer="4402" to-port="0" /> + <edge from-layer="4401" from-port="0" to-layer="4402" to-port="1" /> + <edge from-layer="4402" from-port="2" to-layer="4403" to-port="0" /> + <edge from-layer="4403" from-port="1" to-layer="4404" to-port="1" /> + <edge from-layer="4404" from-port="2" to-layer="4407" to-port="0" /> + <edge from-layer="4405" from-port="0" to-layer="4406" to-port="0" /> + <edge from-layer="4406" from-port="1" to-layer="4407" to-port="1" /> + <edge from-layer="4407" from-port="2" to-layer="4409" to-port="0" /> + <edge from-layer="4408" from-port="0" to-layer="4409" to-port="1" /> + <edge from-layer="4409" from-port="2" to-layer="4411" to-port="0" /> + <edge from-layer="4410" from-port="0" to-layer="4411" to-port="1" /> + <edge from-layer="4411" from-port="2" to-layer="4423" to-port="0" /> + <edge from-layer="4411" from-port="2" to-layer="4413" to-port="0" /> + <edge from-layer="4411" from-port="2" to-layer="4412" to-port="0" /> + <edge from-layer="4411" from-port="2" to-layer="4429" to-port="0" /> + <edge from-layer="4412" from-port="2" to-layer="4432" to-port="0" /> + <edge from-layer="4413" from-port="1" to-layer="4415" to-port="0" /> + <edge from-layer="4414" from-port="0" to-layer="4415" to-port="2" /> + <edge from-layer="4415" from-port="3" to-layer="4416" to-port="0" /> + <edge from-layer="4416" from-port="2" to-layer="4417" to-port="0" /> + <edge from-layer="4417" from-port="1" to-layer="4419" to-port="0" /> + <edge from-layer="4418" from-port="0" to-layer="4419" to-port="1" /> + <edge from-layer="4419" from-port="2" to-layer="4423" to-port="1" /> + <edge from-layer="4419" from-port="2" to-layer="4429" to-port="2" /> + <edge from-layer="4420" from-port="0" to-layer="4423" to-port="2" /> + <edge from-layer="4421" from-port="0" to-layer="4423" to-port="3" /> + <edge from-layer="4422" from-port="0" to-layer="4423" to-port="4" /> + <edge from-layer="4423" from-port="5" to-layer="4425" to-port="0" /> + <edge from-layer="4424" from-port="0" to-layer="4425" to-port="1" /> + <edge from-layer="4425" from-port="2" to-layer="4430" to-port="0" /> + <edge from-layer="4426" from-port="0" to-layer="4429" to-port="1" /> + <edge from-layer="4427" from-port="0" to-layer="4429" to-port="3" /> + <edge from-layer="4428" from-port="0" to-layer="4429" to-port="4" /> + <edge from-layer="4429" from-port="5" to-layer="4430" to-port="1" /> + <edge from-layer="4430" from-port="2" to-layer="4431" to-port="0" /> + <edge from-layer="4431" from-port="2" to-layer="4432" to-port="1" /> + <edge from-layer="4432" from-port="2" to-layer="4433" to-port="1" /> + <edge from-layer="4432" from-port="2" to-layer="4493" to-port="0" /> + <edge from-layer="4433" from-port="2" to-layer="4434" to-port="0" /> + <edge from-layer="4433" from-port="2" to-layer="11206" to-port="0" /> + <edge from-layer="4433" from-port="2" to-layer="4435" to-port="0" /> + <edge from-layer="4434" from-port="2" to-layer="4444" to-port="0" /> + <edge from-layer="4435" from-port="1" to-layer="4442" to-port="0" /> + <edge from-layer="4435" from-port="1" to-layer="4438" to-port="0" /> + <edge from-layer="4436" from-port="0" to-layer="4438" to-port="1" /> + <edge from-layer="4437" from-port="0" to-layer="4438" to-port="2" /> + <edge from-layer="4438" from-port="3" to-layer="4443" to-port="0" /> + <edge from-layer="4439" from-port="0" to-layer="4443" to-port="1" /> + <edge from-layer="4440" from-port="0" to-layer="4442" to-port="1" /> + <edge from-layer="4441" from-port="0" to-layer="4442" to-port="2" /> + <edge from-layer="4442" from-port="3" to-layer="4443" to-port="2" /> + <edge from-layer="4443" from-port="3" to-layer="4444" to-port="1" /> + <edge from-layer="4444" from-port="2" to-layer="4446" to-port="0" /> + <edge from-layer="4445" from-port="0" to-layer="4446" to-port="1" /> + <edge from-layer="4446" from-port="2" to-layer="4501" to-port="1" /> + <edge from-layer="4447" from-port="0" to-layer="4452" to-port="0" /> + <edge from-layer="4448" from-port="0" to-layer="4451" to-port="1" /> + <edge from-layer="4449" from-port="0" to-layer="4451" to-port="2" /> + <edge from-layer="4450" from-port="0" to-layer="4451" to-port="3" /> + <edge from-layer="4451" from-port="4" to-layer="4452" to-port="1" /> + <edge from-layer="4452" from-port="2" to-layer="4453" to-port="0" /> + <edge from-layer="4453" from-port="1" to-layer="4455" to-port="0" /> + <edge from-layer="4454" from-port="0" to-layer="4455" to-port="2" /> + <edge from-layer="4455" from-port="3" to-layer="4474" to-port="0" /> + <edge from-layer="4456" from-port="0" to-layer="4457" to-port="0" /> + <edge from-layer="4457" from-port="1" to-layer="4460" to-port="0" /> + <edge from-layer="4458" from-port="0" to-layer="4459" to-port="0" /> + <edge from-layer="4459" from-port="1" to-layer="4460" to-port="1" /> + <edge from-layer="4460" from-port="2" to-layer="4462" to-port="0" /> + <edge from-layer="4461" from-port="0" to-layer="4462" to-port="1" /> + <edge from-layer="4462" from-port="2" to-layer="4464" to-port="0" /> + <edge from-layer="4463" from-port="0" to-layer="4464" to-port="1" /> + <edge from-layer="4464" from-port="2" to-layer="4465" to-port="0" /> + <edge from-layer="4465" from-port="1" to-layer="4466" to-port="1" /> + <edge from-layer="4466" from-port="2" to-layer="4469" to-port="0" /> + <edge from-layer="4467" from-port="0" to-layer="4468" to-port="0" /> + <edge from-layer="4468" from-port="1" to-layer="4469" to-port="1" /> + <edge from-layer="4469" from-port="2" to-layer="4471" to-port="0" /> + <edge from-layer="4470" from-port="0" to-layer="4471" to-port="1" /> + <edge from-layer="4471" from-port="2" to-layer="4473" to-port="0" /> + <edge from-layer="4472" from-port="0" to-layer="4473" to-port="1" /> + <edge from-layer="4473" from-port="2" to-layer="4474" to-port="1" /> + <edge from-layer="4474" from-port="2" to-layer="11205" to-port="0" /> + <edge from-layer="4474" from-port="2" to-layer="4475" to-port="0" /> + <edge from-layer="4474" from-port="2" to-layer="4476" to-port="0" /> + <edge from-layer="4475" from-port="2" to-layer="4485" to-port="0" /> + <edge from-layer="4476" from-port="1" to-layer="4483" to-port="0" /> + <edge from-layer="4476" from-port="1" to-layer="4479" to-port="0" /> + <edge from-layer="4477" from-port="0" to-layer="4479" to-port="1" /> + <edge from-layer="4478" from-port="0" to-layer="4479" to-port="2" /> + <edge from-layer="4479" from-port="3" to-layer="4484" to-port="1" /> + <edge from-layer="4480" from-port="0" to-layer="4484" to-port="2" /> + <edge from-layer="4481" from-port="0" to-layer="4483" to-port="1" /> + <edge from-layer="4482" from-port="0" to-layer="4483" to-port="2" /> + <edge from-layer="4483" from-port="3" to-layer="4484" to-port="3" /> + <edge from-layer="4484" from-port="4" to-layer="4485" to-port="1" /> + <edge from-layer="4485" from-port="2" to-layer="4487" to-port="0" /> + <edge from-layer="4486" from-port="0" to-layer="4487" to-port="1" /> + <edge from-layer="4487" from-port="2" to-layer="4501" to-port="2" /> + <edge from-layer="4488" from-port="0" to-layer="4500" to-port="1" /> + <edge from-layer="4489" from-port="1" to-layer="4492" to-port="0" /> + <edge from-layer="4490" from-port="0" to-layer="4492" to-port="1" /> + <edge from-layer="4491" from-port="0" to-layer="4492" to-port="2" /> + <edge from-layer="4492" from-port="3" to-layer="4497" to-port="0" /> + <edge from-layer="4493" from-port="1" to-layer="4496" to-port="0" /> + <edge from-layer="4494" from-port="0" to-layer="4496" to-port="1" /> + <edge from-layer="4495" from-port="0" to-layer="4496" to-port="2" /> + <edge from-layer="4496" from-port="3" to-layer="4497" to-port="1" /> + <edge from-layer="4497" from-port="2" to-layer="4500" to-port="2" /> + <edge from-layer="4498" from-port="0" to-layer="4500" to-port="3" /> + <edge from-layer="4499" from-port="0" to-layer="4500" to-port="4" /> + <edge from-layer="4500" from-port="5" to-layer="4501" to-port="3" /> + <edge from-layer="4501" from-port="4" to-layer="4503" to-port="0" /> + <edge from-layer="4502" from-port="0" to-layer="4503" to-port="1" /> + <edge from-layer="4503" from-port="2" to-layer="4505" to-port="0" /> + <edge from-layer="4504" from-port="0" to-layer="4505" to-port="1" /> + <edge from-layer="4505" from-port="2" to-layer="4516" to-port="0" /> + <edge from-layer="4506" from-port="0" to-layer="4507" to-port="0" /> + <edge from-layer="4507" from-port="1" to-layer="4510" to-port="0" /> + <edge from-layer="4508" from-port="0" to-layer="4509" to-port="0" /> + <edge from-layer="4509" from-port="1" to-layer="4510" to-port="1" /> + <edge from-layer="4510" from-port="2" to-layer="4512" to-port="0" /> + <edge from-layer="4511" from-port="0" to-layer="4512" to-port="1" /> + <edge from-layer="4512" from-port="2" to-layer="4514" to-port="0" /> + <edge from-layer="4513" from-port="0" to-layer="4514" to-port="1" /> + <edge from-layer="4514" from-port="2" to-layer="4515" to-port="0" /> + <edge from-layer="4515" from-port="1" to-layer="4516" to-port="1" /> + <edge from-layer="4516" from-port="2" to-layer="4517" to-port="1" /> + <edge from-layer="4517" from-port="2" to-layer="4521" to-port="0" /> + <edge from-layer="4517" from-port="2" to-layer="4528" to-port="0" /> + <edge from-layer="4517" from-port="2" to-layer="4565" to-port="0" /> + <edge from-layer="4518" from-port="0" to-layer="4529" to-port="0" /> + <edge from-layer="4519" from-port="0" to-layer="4527" to-port="0" /> + <edge from-layer="4520" from-port="0" to-layer="4521" to-port="1" /> + <edge from-layer="4521" from-port="2" to-layer="4523" to-port="0" /> + <edge from-layer="4522" from-port="0" to-layer="4523" to-port="1" /> + <edge from-layer="4523" from-port="2" to-layer="4525" to-port="0" /> + <edge from-layer="4524" from-port="0" to-layer="4525" to-port="1" /> + <edge from-layer="4525" from-port="2" to-layer="4526" to-port="0" /> + <edge from-layer="4526" from-port="1" to-layer="4527" to-port="1" /> + <edge from-layer="4527" from-port="2" to-layer="4528" to-port="1" /> + <edge from-layer="4528" from-port="2" to-layer="4529" to-port="1" /> + <edge from-layer="4529" from-port="2" to-layer="4540" to-port="0" /> + <edge from-layer="4529" from-port="2" to-layer="4552" to-port="0" /> + <edge from-layer="4530" from-port="0" to-layer="4531" to-port="0" /> + <edge from-layer="4531" from-port="1" to-layer="4534" to-port="0" /> + <edge from-layer="4532" from-port="0" to-layer="4533" to-port="0" /> + <edge from-layer="4533" from-port="1" to-layer="4534" to-port="1" /> + <edge from-layer="4534" from-port="2" to-layer="4536" to-port="0" /> + <edge from-layer="4535" from-port="0" to-layer="4536" to-port="1" /> + <edge from-layer="4536" from-port="2" to-layer="4538" to-port="0" /> + <edge from-layer="4537" from-port="0" to-layer="4538" to-port="1" /> + <edge from-layer="4538" from-port="2" to-layer="4539" to-port="0" /> + <edge from-layer="4539" from-port="1" to-layer="4540" to-port="1" /> + <edge from-layer="4540" from-port="2" to-layer="4541" to-port="0" /> + <edge from-layer="4541" from-port="1" to-layer="4553" to-port="0" /> + <edge from-layer="4542" from-port="0" to-layer="4543" to-port="0" /> + <edge from-layer="4543" from-port="1" to-layer="4546" to-port="0" /> + <edge from-layer="4544" from-port="0" to-layer="4545" to-port="0" /> + <edge from-layer="4545" from-port="1" to-layer="4546" to-port="1" /> + <edge from-layer="4546" from-port="2" to-layer="4548" to-port="0" /> + <edge from-layer="4547" from-port="0" to-layer="4548" to-port="1" /> + <edge from-layer="4548" from-port="2" to-layer="4550" to-port="0" /> + <edge from-layer="4549" from-port="0" to-layer="4550" to-port="1" /> + <edge from-layer="4550" from-port="2" to-layer="4551" to-port="0" /> + <edge from-layer="4551" from-port="1" to-layer="4552" to-port="1" /> + <edge from-layer="4552" from-port="2" to-layer="4553" to-port="1" /> + <edge from-layer="4553" from-port="2" to-layer="4564" to-port="0" /> + <edge from-layer="4554" from-port="0" to-layer="4555" to-port="0" /> + <edge from-layer="4555" from-port="1" to-layer="4558" to-port="0" /> + <edge from-layer="4556" from-port="0" to-layer="4557" to-port="0" /> + <edge from-layer="4557" from-port="1" to-layer="4558" to-port="1" /> + <edge from-layer="4558" from-port="2" to-layer="4560" to-port="0" /> + <edge from-layer="4559" from-port="0" to-layer="4560" to-port="1" /> + <edge from-layer="4560" from-port="2" to-layer="4562" to-port="0" /> + <edge from-layer="4561" from-port="0" to-layer="4562" to-port="1" /> + <edge from-layer="4562" from-port="2" to-layer="4563" to-port="0" /> + <edge from-layer="4563" from-port="1" to-layer="4564" to-port="1" /> + <edge from-layer="4564" from-port="2" to-layer="4565" to-port="1" /> + <edge from-layer="4565" from-port="2" to-layer="4749" to-port="0" /> + <edge from-layer="4565" from-port="2" to-layer="4569" to-port="0" /> + <edge from-layer="4565" from-port="2" to-layer="4576" to-port="0" /> + <edge from-layer="4566" from-port="0" to-layer="4577" to-port="0" /> + <edge from-layer="4567" from-port="0" to-layer="4575" to-port="0" /> + <edge from-layer="4568" from-port="0" to-layer="4569" to-port="1" /> + <edge from-layer="4569" from-port="2" to-layer="4571" to-port="0" /> + <edge from-layer="4570" from-port="0" to-layer="4571" to-port="1" /> + <edge from-layer="4571" from-port="2" to-layer="4573" to-port="0" /> + <edge from-layer="4572" from-port="0" to-layer="4573" to-port="1" /> + <edge from-layer="4573" from-port="2" to-layer="4574" to-port="0" /> + <edge from-layer="4574" from-port="1" to-layer="4575" to-port="1" /> + <edge from-layer="4575" from-port="2" to-layer="4576" to-port="1" /> + <edge from-layer="4576" from-port="2" to-layer="4577" to-port="1" /> + <edge from-layer="4577" from-port="2" to-layer="4636" to-port="0" /> + <edge from-layer="4577" from-port="2" to-layer="4698" to-port="0" /> + <edge from-layer="4577" from-port="2" to-layer="4588" to-port="0" /> + <edge from-layer="4578" from-port="0" to-layer="4579" to-port="0" /> + <edge from-layer="4579" from-port="1" to-layer="4582" to-port="0" /> + <edge from-layer="4580" from-port="0" to-layer="4581" to-port="0" /> + <edge from-layer="4581" from-port="1" to-layer="4582" to-port="1" /> + <edge from-layer="4582" from-port="2" to-layer="4584" to-port="0" /> + <edge from-layer="4583" from-port="0" to-layer="4584" to-port="1" /> + <edge from-layer="4584" from-port="2" to-layer="4586" to-port="0" /> + <edge from-layer="4585" from-port="0" to-layer="4586" to-port="1" /> + <edge from-layer="4586" from-port="2" to-layer="4587" to-port="0" /> + <edge from-layer="4587" from-port="1" to-layer="4588" to-port="1" /> + <edge from-layer="4588" from-port="2" to-layer="4591" to-port="0" /> + <edge from-layer="4589" from-port="0" to-layer="4590" to-port="0" /> + <edge from-layer="4590" from-port="1" to-layer="4591" to-port="1" /> + <edge from-layer="4591" from-port="2" to-layer="4593" to-port="0" /> + <edge from-layer="4592" from-port="0" to-layer="4593" to-port="1" /> + <edge from-layer="4593" from-port="2" to-layer="4595" to-port="0" /> + <edge from-layer="4594" from-port="0" to-layer="4595" to-port="1" /> + <edge from-layer="4595" from-port="2" to-layer="4596" to-port="0" /> + <edge from-layer="4595" from-port="2" to-layer="4613" to-port="0" /> + <edge from-layer="4595" from-port="2" to-layer="4607" to-port="0" /> + <edge from-layer="4595" from-port="2" to-layer="4597" to-port="0" /> + <edge from-layer="4596" from-port="2" to-layer="4616" to-port="0" /> + <edge from-layer="4597" from-port="1" to-layer="4599" to-port="0" /> + <edge from-layer="4598" from-port="0" to-layer="4599" to-port="2" /> + <edge from-layer="4599" from-port="3" to-layer="4600" to-port="0" /> + <edge from-layer="4600" from-port="2" to-layer="4601" to-port="0" /> + <edge from-layer="4601" from-port="1" to-layer="4603" to-port="0" /> + <edge from-layer="4602" from-port="0" to-layer="4603" to-port="1" /> + <edge from-layer="4603" from-port="2" to-layer="4613" to-port="2" /> + <edge from-layer="4603" from-port="2" to-layer="4607" to-port="1" /> + <edge from-layer="4604" from-port="0" to-layer="4607" to-port="2" /> + <edge from-layer="4605" from-port="0" to-layer="4607" to-port="3" /> + <edge from-layer="4606" from-port="0" to-layer="4607" to-port="4" /> + <edge from-layer="4607" from-port="5" to-layer="4609" to-port="0" /> + <edge from-layer="4608" from-port="0" to-layer="4609" to-port="1" /> + <edge from-layer="4609" from-port="2" to-layer="4614" to-port="0" /> + <edge from-layer="4610" from-port="0" to-layer="4613" to-port="1" /> + <edge from-layer="4611" from-port="0" to-layer="4613" to-port="3" /> + <edge from-layer="4612" from-port="0" to-layer="4613" to-port="4" /> + <edge from-layer="4613" from-port="5" to-layer="4614" to-port="1" /> + <edge from-layer="4614" from-port="2" to-layer="4615" to-port="0" /> + <edge from-layer="4615" from-port="2" to-layer="4616" to-port="1" /> + <edge from-layer="4616" from-port="2" to-layer="4733" to-port="0" /> + <edge from-layer="4617" from-port="0" to-layer="4622" to-port="0" /> + <edge from-layer="4618" from-port="0" to-layer="4621" to-port="1" /> + <edge from-layer="4619" from-port="0" to-layer="4621" to-port="2" /> + <edge from-layer="4620" from-port="0" to-layer="4621" to-port="3" /> + <edge from-layer="4621" from-port="4" to-layer="4622" to-port="1" /> + <edge from-layer="4622" from-port="2" to-layer="4623" to-port="0" /> + <edge from-layer="4623" from-port="1" to-layer="4625" to-port="0" /> + <edge from-layer="4624" from-port="0" to-layer="4625" to-port="2" /> + <edge from-layer="4625" from-port="3" to-layer="4721" to-port="0" /> + <edge from-layer="4625" from-port="3" to-layer="4665" to-port="0" /> + <edge from-layer="4626" from-port="0" to-layer="4627" to-port="0" /> + <edge from-layer="4627" from-port="1" to-layer="4630" to-port="0" /> + <edge from-layer="4628" from-port="0" to-layer="4629" to-port="0" /> + <edge from-layer="4629" from-port="1" to-layer="4630" to-port="1" /> + <edge from-layer="4630" from-port="2" to-layer="4632" to-port="0" /> + <edge from-layer="4631" from-port="0" to-layer="4632" to-port="1" /> + <edge from-layer="4632" from-port="2" to-layer="4634" to-port="0" /> + <edge from-layer="4633" from-port="0" to-layer="4634" to-port="1" /> + <edge from-layer="4634" from-port="2" to-layer="4635" to-port="0" /> + <edge from-layer="4635" from-port="1" to-layer="4636" to-port="1" /> + <edge from-layer="4636" from-port="2" to-layer="4639" to-port="0" /> + <edge from-layer="4637" from-port="0" to-layer="4638" to-port="0" /> + <edge from-layer="4638" from-port="1" to-layer="4639" to-port="1" /> + <edge from-layer="4639" from-port="2" to-layer="4641" to-port="0" /> + <edge from-layer="4640" from-port="0" to-layer="4641" to-port="1" /> + <edge from-layer="4641" from-port="2" to-layer="4643" to-port="0" /> + <edge from-layer="4642" from-port="0" to-layer="4643" to-port="1" /> + <edge from-layer="4643" from-port="2" to-layer="4661" to-port="0" /> + <edge from-layer="4643" from-port="2" to-layer="4655" to-port="0" /> + <edge from-layer="4643" from-port="2" to-layer="4645" to-port="0" /> + <edge from-layer="4643" from-port="2" to-layer="4644" to-port="0" /> + <edge from-layer="4644" from-port="2" to-layer="4664" to-port="0" /> + <edge from-layer="4645" from-port="1" to-layer="4647" to-port="0" /> + <edge from-layer="4646" from-port="0" to-layer="4647" to-port="2" /> + <edge from-layer="4647" from-port="3" to-layer="4648" to-port="0" /> + <edge from-layer="4648" from-port="2" to-layer="4649" to-port="0" /> + <edge from-layer="4649" from-port="1" to-layer="4651" to-port="0" /> + <edge from-layer="4650" from-port="0" to-layer="4651" to-port="1" /> + <edge from-layer="4651" from-port="2" to-layer="4661" to-port="2" /> + <edge from-layer="4651" from-port="2" to-layer="4655" to-port="1" /> + <edge from-layer="4652" from-port="0" to-layer="4655" to-port="2" /> + <edge from-layer="4653" from-port="0" to-layer="4655" to-port="3" /> + <edge from-layer="4654" from-port="0" to-layer="4655" to-port="4" /> + <edge from-layer="4655" from-port="5" to-layer="4657" to-port="0" /> + <edge from-layer="4656" from-port="0" to-layer="4657" to-port="1" /> + <edge from-layer="4657" from-port="2" to-layer="4662" to-port="0" /> + <edge from-layer="4658" from-port="0" to-layer="4661" to-port="1" /> + <edge from-layer="4659" from-port="0" to-layer="4661" to-port="3" /> + <edge from-layer="4660" from-port="0" to-layer="4661" to-port="4" /> + <edge from-layer="4661" from-port="5" to-layer="4662" to-port="1" /> + <edge from-layer="4662" from-port="2" to-layer="4663" to-port="0" /> + <edge from-layer="4663" from-port="2" to-layer="4664" to-port="1" /> + <edge from-layer="4664" from-port="2" to-layer="4725" to-port="0" /> + <edge from-layer="4664" from-port="2" to-layer="4665" to-port="1" /> + <edge from-layer="4665" from-port="2" to-layer="4666" to-port="0" /> + <edge from-layer="4665" from-port="2" to-layer="11204" to-port="0" /> + <edge from-layer="4665" from-port="2" to-layer="4667" to-port="0" /> + <edge from-layer="4666" from-port="2" to-layer="4676" to-port="0" /> + <edge from-layer="4667" from-port="1" to-layer="4670" to-port="0" /> + <edge from-layer="4667" from-port="1" to-layer="4674" to-port="0" /> + <edge from-layer="4668" from-port="0" to-layer="4670" to-port="1" /> + <edge from-layer="4669" from-port="0" to-layer="4670" to-port="2" /> + <edge from-layer="4670" from-port="3" to-layer="4675" to-port="0" /> + <edge from-layer="4671" from-port="0" to-layer="4675" to-port="1" /> + <edge from-layer="4672" from-port="0" to-layer="4674" to-port="1" /> + <edge from-layer="4673" from-port="0" to-layer="4674" to-port="2" /> + <edge from-layer="4674" from-port="3" to-layer="4675" to-port="2" /> + <edge from-layer="4675" from-port="3" to-layer="4676" to-port="1" /> + <edge from-layer="4676" from-port="2" to-layer="4678" to-port="0" /> + <edge from-layer="4677" from-port="0" to-layer="4678" to-port="1" /> + <edge from-layer="4678" from-port="2" to-layer="4733" to-port="1" /> + <edge from-layer="4679" from-port="0" to-layer="4684" to-port="0" /> + <edge from-layer="4680" from-port="0" to-layer="4683" to-port="1" /> + <edge from-layer="4681" from-port="0" to-layer="4683" to-port="2" /> + <edge from-layer="4682" from-port="0" to-layer="4683" to-port="3" /> + <edge from-layer="4683" from-port="4" to-layer="4684" to-port="1" /> + <edge from-layer="4684" from-port="2" to-layer="4685" to-port="0" /> + <edge from-layer="4685" from-port="1" to-layer="4687" to-port="0" /> + <edge from-layer="4686" from-port="0" to-layer="4687" to-port="2" /> + <edge from-layer="4687" from-port="3" to-layer="4706" to-port="0" /> + <edge from-layer="4688" from-port="0" to-layer="4689" to-port="0" /> + <edge from-layer="4689" from-port="1" to-layer="4692" to-port="0" /> + <edge from-layer="4690" from-port="0" to-layer="4691" to-port="0" /> + <edge from-layer="4691" from-port="1" to-layer="4692" to-port="1" /> + <edge from-layer="4692" from-port="2" to-layer="4694" to-port="0" /> + <edge from-layer="4693" from-port="0" to-layer="4694" to-port="1" /> + <edge from-layer="4694" from-port="2" to-layer="4696" to-port="0" /> + <edge from-layer="4695" from-port="0" to-layer="4696" to-port="1" /> + <edge from-layer="4696" from-port="2" to-layer="4697" to-port="0" /> + <edge from-layer="4697" from-port="1" to-layer="4698" to-port="1" /> + <edge from-layer="4698" from-port="2" to-layer="4701" to-port="0" /> + <edge from-layer="4699" from-port="0" to-layer="4700" to-port="0" /> + <edge from-layer="4700" from-port="1" to-layer="4701" to-port="1" /> + <edge from-layer="4701" from-port="2" to-layer="4703" to-port="0" /> + <edge from-layer="4702" from-port="0" to-layer="4703" to-port="1" /> + <edge from-layer="4703" from-port="2" to-layer="4705" to-port="0" /> + <edge from-layer="4704" from-port="0" to-layer="4705" to-port="1" /> + <edge from-layer="4705" from-port="2" to-layer="4706" to-port="1" /> + <edge from-layer="4706" from-port="2" to-layer="4707" to-port="0" /> + <edge from-layer="4706" from-port="2" to-layer="4708" to-port="0" /> + <edge from-layer="4706" from-port="2" to-layer="11203" to-port="0" /> + <edge from-layer="4707" from-port="2" to-layer="4717" to-port="0" /> + <edge from-layer="4708" from-port="1" to-layer="4711" to-port="0" /> + <edge from-layer="4708" from-port="1" to-layer="4715" to-port="0" /> + <edge from-layer="4709" from-port="0" to-layer="4711" to-port="1" /> + <edge from-layer="4710" from-port="0" to-layer="4711" to-port="2" /> + <edge from-layer="4711" from-port="3" to-layer="4716" to-port="1" /> + <edge from-layer="4712" from-port="0" to-layer="4716" to-port="2" /> + <edge from-layer="4713" from-port="0" to-layer="4715" to-port="1" /> + <edge from-layer="4714" from-port="0" to-layer="4715" to-port="2" /> + <edge from-layer="4715" from-port="3" to-layer="4716" to-port="3" /> + <edge from-layer="4716" from-port="4" to-layer="4717" to-port="1" /> + <edge from-layer="4717" from-port="2" to-layer="4719" to-port="0" /> + <edge from-layer="4718" from-port="0" to-layer="4719" to-port="1" /> + <edge from-layer="4719" from-port="2" to-layer="4733" to-port="2" /> + <edge from-layer="4720" from-port="0" to-layer="4732" to-port="1" /> + <edge from-layer="4721" from-port="1" to-layer="4724" to-port="0" /> + <edge from-layer="4722" from-port="0" to-layer="4724" to-port="1" /> + <edge from-layer="4723" from-port="0" to-layer="4724" to-port="2" /> + <edge from-layer="4724" from-port="3" to-layer="4729" to-port="0" /> + <edge from-layer="4725" from-port="1" to-layer="4728" to-port="0" /> + <edge from-layer="4726" from-port="0" to-layer="4728" to-port="1" /> + <edge from-layer="4727" from-port="0" to-layer="4728" to-port="2" /> + <edge from-layer="4728" from-port="3" to-layer="4729" to-port="1" /> + <edge from-layer="4729" from-port="2" to-layer="4732" to-port="2" /> + <edge from-layer="4730" from-port="0" to-layer="4732" to-port="3" /> + <edge from-layer="4731" from-port="0" to-layer="4732" to-port="4" /> + <edge from-layer="4732" from-port="5" to-layer="4733" to-port="3" /> + <edge from-layer="4733" from-port="4" to-layer="4735" to-port="0" /> + <edge from-layer="4734" from-port="0" to-layer="4735" to-port="1" /> + <edge from-layer="4735" from-port="2" to-layer="4737" to-port="0" /> + <edge from-layer="4736" from-port="0" to-layer="4737" to-port="1" /> + <edge from-layer="4737" from-port="2" to-layer="4748" to-port="0" /> + <edge from-layer="4738" from-port="0" to-layer="4739" to-port="0" /> + <edge from-layer="4739" from-port="1" to-layer="4742" to-port="0" /> + <edge from-layer="4740" from-port="0" to-layer="4741" to-port="0" /> + <edge from-layer="4741" from-port="1" to-layer="4742" to-port="1" /> + <edge from-layer="4742" from-port="2" to-layer="4744" to-port="0" /> + <edge from-layer="4743" from-port="0" to-layer="4744" to-port="1" /> + <edge from-layer="4744" from-port="2" to-layer="4746" to-port="0" /> + <edge from-layer="4745" from-port="0" to-layer="4746" to-port="1" /> + <edge from-layer="4746" from-port="2" to-layer="4747" to-port="0" /> + <edge from-layer="4747" from-port="1" to-layer="4748" to-port="1" /> + <edge from-layer="4748" from-port="2" to-layer="4749" to-port="1" /> + <edge from-layer="4749" from-port="2" to-layer="4753" to-port="0" /> + <edge from-layer="4749" from-port="2" to-layer="4760" to-port="0" /> + <edge from-layer="4749" from-port="2" to-layer="4797" to-port="0" /> + <edge from-layer="4750" from-port="0" to-layer="4761" to-port="0" /> + <edge from-layer="4751" from-port="0" to-layer="4759" to-port="0" /> + <edge from-layer="4752" from-port="0" to-layer="4753" to-port="1" /> + <edge from-layer="4753" from-port="2" to-layer="4755" to-port="0" /> + <edge from-layer="4754" from-port="0" to-layer="4755" to-port="1" /> + <edge from-layer="4755" from-port="2" to-layer="4757" to-port="0" /> + <edge from-layer="4756" from-port="0" to-layer="4757" to-port="1" /> + <edge from-layer="4757" from-port="2" to-layer="4758" to-port="0" /> + <edge from-layer="4758" from-port="1" to-layer="4759" to-port="1" /> + <edge from-layer="4759" from-port="2" to-layer="4760" to-port="1" /> + <edge from-layer="4760" from-port="2" to-layer="4761" to-port="1" /> + <edge from-layer="4761" from-port="2" to-layer="4772" to-port="0" /> + <edge from-layer="4761" from-port="2" to-layer="4784" to-port="0" /> + <edge from-layer="4762" from-port="0" to-layer="4763" to-port="0" /> + <edge from-layer="4763" from-port="1" to-layer="4766" to-port="0" /> + <edge from-layer="4764" from-port="0" to-layer="4765" to-port="0" /> + <edge from-layer="4765" from-port="1" to-layer="4766" to-port="1" /> + <edge from-layer="4766" from-port="2" to-layer="4768" to-port="0" /> + <edge from-layer="4767" from-port="0" to-layer="4768" to-port="1" /> + <edge from-layer="4768" from-port="2" to-layer="4770" to-port="0" /> + <edge from-layer="4769" from-port="0" to-layer="4770" to-port="1" /> + <edge from-layer="4770" from-port="2" to-layer="4771" to-port="0" /> + <edge from-layer="4771" from-port="1" to-layer="4772" to-port="1" /> + <edge from-layer="4772" from-port="2" to-layer="4773" to-port="0" /> + <edge from-layer="4773" from-port="1" to-layer="4785" to-port="0" /> + <edge from-layer="4774" from-port="0" to-layer="4775" to-port="0" /> + <edge from-layer="4775" from-port="1" to-layer="4778" to-port="0" /> + <edge from-layer="4776" from-port="0" to-layer="4777" to-port="0" /> + <edge from-layer="4777" from-port="1" to-layer="4778" to-port="1" /> + <edge from-layer="4778" from-port="2" to-layer="4780" to-port="0" /> + <edge from-layer="4779" from-port="0" to-layer="4780" to-port="1" /> + <edge from-layer="4780" from-port="2" to-layer="4782" to-port="0" /> + <edge from-layer="4781" from-port="0" to-layer="4782" to-port="1" /> + <edge from-layer="4782" from-port="2" to-layer="4783" to-port="0" /> + <edge from-layer="4783" from-port="1" to-layer="4784" to-port="1" /> + <edge from-layer="4784" from-port="2" to-layer="4785" to-port="1" /> + <edge from-layer="4785" from-port="2" to-layer="4796" to-port="0" /> + <edge from-layer="4786" from-port="0" to-layer="4787" to-port="0" /> + <edge from-layer="4787" from-port="1" to-layer="4790" to-port="0" /> + <edge from-layer="4788" from-port="0" to-layer="4789" to-port="0" /> + <edge from-layer="4789" from-port="1" to-layer="4790" to-port="1" /> + <edge from-layer="4790" from-port="2" to-layer="4792" to-port="0" /> + <edge from-layer="4791" from-port="0" to-layer="4792" to-port="1" /> + <edge from-layer="4792" from-port="2" to-layer="4794" to-port="0" /> + <edge from-layer="4793" from-port="0" to-layer="4794" to-port="1" /> + <edge from-layer="4794" from-port="2" to-layer="4795" to-port="0" /> + <edge from-layer="4795" from-port="1" to-layer="4796" to-port="1" /> + <edge from-layer="4796" from-port="2" to-layer="4797" to-port="1" /> + <edge from-layer="4797" from-port="2" to-layer="4981" to-port="0" /> + <edge from-layer="4797" from-port="2" to-layer="4801" to-port="0" /> + <edge from-layer="4797" from-port="2" to-layer="4808" to-port="0" /> + <edge from-layer="4798" from-port="0" to-layer="4809" to-port="0" /> + <edge from-layer="4799" from-port="0" to-layer="4807" to-port="0" /> + <edge from-layer="4800" from-port="0" to-layer="4801" to-port="1" /> + <edge from-layer="4801" from-port="2" to-layer="4803" to-port="0" /> + <edge from-layer="4802" from-port="0" to-layer="4803" to-port="1" /> + <edge from-layer="4803" from-port="2" to-layer="4805" to-port="0" /> + <edge from-layer="4804" from-port="0" to-layer="4805" to-port="1" /> + <edge from-layer="4805" from-port="2" to-layer="4806" to-port="0" /> + <edge from-layer="4806" from-port="1" to-layer="4807" to-port="1" /> + <edge from-layer="4807" from-port="2" to-layer="4808" to-port="1" /> + <edge from-layer="4808" from-port="2" to-layer="4809" to-port="1" /> + <edge from-layer="4809" from-port="2" to-layer="4820" to-port="0" /> + <edge from-layer="4809" from-port="2" to-layer="4868" to-port="0" /> + <edge from-layer="4809" from-port="2" to-layer="4930" to-port="0" /> + <edge from-layer="4810" from-port="0" to-layer="4811" to-port="0" /> + <edge from-layer="4811" from-port="1" to-layer="4814" to-port="0" /> + <edge from-layer="4812" from-port="0" to-layer="4813" to-port="0" /> + <edge from-layer="4813" from-port="1" to-layer="4814" to-port="1" /> + <edge from-layer="4814" from-port="2" to-layer="4816" to-port="0" /> + <edge from-layer="4815" from-port="0" to-layer="4816" to-port="1" /> + <edge from-layer="4816" from-port="2" to-layer="4818" to-port="0" /> + <edge from-layer="4817" from-port="0" to-layer="4818" to-port="1" /> + <edge from-layer="4818" from-port="2" to-layer="4819" to-port="0" /> + <edge from-layer="4819" from-port="1" to-layer="4820" to-port="1" /> + <edge from-layer="4820" from-port="2" to-layer="4823" to-port="0" /> + <edge from-layer="4821" from-port="0" to-layer="4822" to-port="0" /> + <edge from-layer="4822" from-port="1" to-layer="4823" to-port="1" /> + <edge from-layer="4823" from-port="2" to-layer="4825" to-port="0" /> + <edge from-layer="4824" from-port="0" to-layer="4825" to-port="1" /> + <edge from-layer="4825" from-port="2" to-layer="4827" to-port="0" /> + <edge from-layer="4826" from-port="0" to-layer="4827" to-port="1" /> + <edge from-layer="4827" from-port="2" to-layer="4829" to-port="0" /> + <edge from-layer="4827" from-port="2" to-layer="4845" to-port="0" /> + <edge from-layer="4827" from-port="2" to-layer="4828" to-port="0" /> + <edge from-layer="4827" from-port="2" to-layer="4839" to-port="0" /> + <edge from-layer="4828" from-port="2" to-layer="4848" to-port="0" /> + <edge from-layer="4829" from-port="1" to-layer="4831" to-port="0" /> + <edge from-layer="4830" from-port="0" to-layer="4831" to-port="2" /> + <edge from-layer="4831" from-port="3" to-layer="4832" to-port="0" /> + <edge from-layer="4832" from-port="2" to-layer="4833" to-port="0" /> + <edge from-layer="4833" from-port="1" to-layer="4835" to-port="0" /> + <edge from-layer="4834" from-port="0" to-layer="4835" to-port="1" /> + <edge from-layer="4835" from-port="2" to-layer="4845" to-port="2" /> + <edge from-layer="4835" from-port="2" to-layer="4839" to-port="1" /> + <edge from-layer="4836" from-port="0" to-layer="4839" to-port="2" /> + <edge from-layer="4837" from-port="0" to-layer="4839" to-port="3" /> + <edge from-layer="4838" from-port="0" to-layer="4839" to-port="4" /> + <edge from-layer="4839" from-port="5" to-layer="4841" to-port="0" /> + <edge from-layer="4840" from-port="0" to-layer="4841" to-port="1" /> + <edge from-layer="4841" from-port="2" to-layer="4846" to-port="0" /> + <edge from-layer="4842" from-port="0" to-layer="4845" to-port="1" /> + <edge from-layer="4843" from-port="0" to-layer="4845" to-port="3" /> + <edge from-layer="4844" from-port="0" to-layer="4845" to-port="4" /> + <edge from-layer="4845" from-port="5" to-layer="4846" to-port="1" /> + <edge from-layer="4846" from-port="2" to-layer="4847" to-port="0" /> + <edge from-layer="4847" from-port="2" to-layer="4848" to-port="1" /> + <edge from-layer="4848" from-port="2" to-layer="4965" to-port="0" /> + <edge from-layer="4849" from-port="0" to-layer="4854" to-port="0" /> + <edge from-layer="4850" from-port="0" to-layer="4853" to-port="1" /> + <edge from-layer="4851" from-port="0" to-layer="4853" to-port="2" /> + <edge from-layer="4852" from-port="0" to-layer="4853" to-port="3" /> + <edge from-layer="4853" from-port="4" to-layer="4854" to-port="1" /> + <edge from-layer="4854" from-port="2" to-layer="4855" to-port="0" /> + <edge from-layer="4855" from-port="1" to-layer="4857" to-port="0" /> + <edge from-layer="4856" from-port="0" to-layer="4857" to-port="2" /> + <edge from-layer="4857" from-port="3" to-layer="4897" to-port="0" /> + <edge from-layer="4857" from-port="3" to-layer="4953" to-port="0" /> + <edge from-layer="4858" from-port="0" to-layer="4859" to-port="0" /> + <edge from-layer="4859" from-port="1" to-layer="4862" to-port="0" /> + <edge from-layer="4860" from-port="0" to-layer="4861" to-port="0" /> + <edge from-layer="4861" from-port="1" to-layer="4862" to-port="1" /> + <edge from-layer="4862" from-port="2" to-layer="4864" to-port="0" /> + <edge from-layer="4863" from-port="0" to-layer="4864" to-port="1" /> + <edge from-layer="4864" from-port="2" to-layer="4866" to-port="0" /> + <edge from-layer="4865" from-port="0" to-layer="4866" to-port="1" /> + <edge from-layer="4866" from-port="2" to-layer="4867" to-port="0" /> + <edge from-layer="4867" from-port="1" to-layer="4868" to-port="1" /> + <edge from-layer="4868" from-port="2" to-layer="4871" to-port="0" /> + <edge from-layer="4869" from-port="0" to-layer="4870" to-port="0" /> + <edge from-layer="4870" from-port="1" to-layer="4871" to-port="1" /> + <edge from-layer="4871" from-port="2" to-layer="4873" to-port="0" /> + <edge from-layer="4872" from-port="0" to-layer="4873" to-port="1" /> + <edge from-layer="4873" from-port="2" to-layer="4875" to-port="0" /> + <edge from-layer="4874" from-port="0" to-layer="4875" to-port="1" /> + <edge from-layer="4875" from-port="2" to-layer="4876" to-port="0" /> + <edge from-layer="4875" from-port="2" to-layer="4877" to-port="0" /> + <edge from-layer="4875" from-port="2" to-layer="4887" to-port="0" /> + <edge from-layer="4875" from-port="2" to-layer="4893" to-port="0" /> + <edge from-layer="4876" from-port="2" to-layer="4896" to-port="0" /> + <edge from-layer="4877" from-port="1" to-layer="4879" to-port="0" /> + <edge from-layer="4878" from-port="0" to-layer="4879" to-port="2" /> + <edge from-layer="4879" from-port="3" to-layer="4880" to-port="0" /> + <edge from-layer="4880" from-port="2" to-layer="4881" to-port="0" /> + <edge from-layer="4881" from-port="1" to-layer="4883" to-port="0" /> + <edge from-layer="4882" from-port="0" to-layer="4883" to-port="1" /> + <edge from-layer="4883" from-port="2" to-layer="4893" to-port="2" /> + <edge from-layer="4883" from-port="2" to-layer="4887" to-port="1" /> + <edge from-layer="4884" from-port="0" to-layer="4887" to-port="2" /> + <edge from-layer="4885" from-port="0" to-layer="4887" to-port="3" /> + <edge from-layer="4886" from-port="0" to-layer="4887" to-port="4" /> + <edge from-layer="4887" from-port="5" to-layer="4889" to-port="0" /> + <edge from-layer="4888" from-port="0" to-layer="4889" to-port="1" /> + <edge from-layer="4889" from-port="2" to-layer="4894" to-port="0" /> + <edge from-layer="4890" from-port="0" to-layer="4893" to-port="1" /> + <edge from-layer="4891" from-port="0" to-layer="4893" to-port="3" /> + <edge from-layer="4892" from-port="0" to-layer="4893" to-port="4" /> + <edge from-layer="4893" from-port="5" to-layer="4894" to-port="1" /> + <edge from-layer="4894" from-port="2" to-layer="4895" to-port="0" /> + <edge from-layer="4895" from-port="2" to-layer="4896" to-port="1" /> + <edge from-layer="4896" from-port="2" to-layer="4897" to-port="1" /> + <edge from-layer="4896" from-port="2" to-layer="4957" to-port="0" /> + <edge from-layer="4897" from-port="2" to-layer="4898" to-port="0" /> + <edge from-layer="4897" from-port="2" to-layer="4899" to-port="0" /> + <edge from-layer="4897" from-port="2" to-layer="11200" to-port="0" /> + <edge from-layer="4898" from-port="2" to-layer="4908" to-port="0" /> + <edge from-layer="4899" from-port="1" to-layer="4902" to-port="0" /> + <edge from-layer="4899" from-port="1" to-layer="4906" to-port="0" /> + <edge from-layer="4900" from-port="0" to-layer="4902" to-port="1" /> + <edge from-layer="4901" from-port="0" to-layer="4902" to-port="2" /> + <edge from-layer="4902" from-port="3" to-layer="4907" to-port="0" /> + <edge from-layer="4903" from-port="0" to-layer="4907" to-port="1" /> + <edge from-layer="4904" from-port="0" to-layer="4906" to-port="1" /> + <edge from-layer="4905" from-port="0" to-layer="4906" to-port="2" /> + <edge from-layer="4906" from-port="3" to-layer="4907" to-port="2" /> + <edge from-layer="4907" from-port="3" to-layer="4908" to-port="1" /> + <edge from-layer="4908" from-port="2" to-layer="4910" to-port="0" /> + <edge from-layer="4909" from-port="0" to-layer="4910" to-port="1" /> + <edge from-layer="4910" from-port="2" to-layer="4965" to-port="1" /> + <edge from-layer="4911" from-port="0" to-layer="4916" to-port="0" /> + <edge from-layer="4912" from-port="0" to-layer="4915" to-port="1" /> + <edge from-layer="4913" from-port="0" to-layer="4915" to-port="2" /> + <edge from-layer="4914" from-port="0" to-layer="4915" to-port="3" /> + <edge from-layer="4915" from-port="4" to-layer="4916" to-port="1" /> + <edge from-layer="4916" from-port="2" to-layer="4917" to-port="0" /> + <edge from-layer="4917" from-port="1" to-layer="4919" to-port="0" /> + <edge from-layer="4918" from-port="0" to-layer="4919" to-port="2" /> + <edge from-layer="4919" from-port="3" to-layer="4938" to-port="0" /> + <edge from-layer="4920" from-port="0" to-layer="4921" to-port="0" /> + <edge from-layer="4921" from-port="1" to-layer="4924" to-port="0" /> + <edge from-layer="4922" from-port="0" to-layer="4923" to-port="0" /> + <edge from-layer="4923" from-port="1" to-layer="4924" to-port="1" /> + <edge from-layer="4924" from-port="2" to-layer="4926" to-port="0" /> + <edge from-layer="4925" from-port="0" to-layer="4926" to-port="1" /> + <edge from-layer="4926" from-port="2" to-layer="4928" to-port="0" /> + <edge from-layer="4927" from-port="0" to-layer="4928" to-port="1" /> + <edge from-layer="4928" from-port="2" to-layer="4929" to-port="0" /> + <edge from-layer="4929" from-port="1" to-layer="4930" to-port="1" /> + <edge from-layer="4930" from-port="2" to-layer="4933" to-port="0" /> + <edge from-layer="4931" from-port="0" to-layer="4932" to-port="0" /> + <edge from-layer="4932" from-port="1" to-layer="4933" to-port="1" /> + <edge from-layer="4933" from-port="2" to-layer="4935" to-port="0" /> + <edge from-layer="4934" from-port="0" to-layer="4935" to-port="1" /> + <edge from-layer="4935" from-port="2" to-layer="4937" to-port="0" /> + <edge from-layer="4936" from-port="0" to-layer="4937" to-port="1" /> + <edge from-layer="4937" from-port="2" to-layer="4938" to-port="1" /> + <edge from-layer="4938" from-port="2" to-layer="11199" to-port="0" /> + <edge from-layer="4938" from-port="2" to-layer="4939" to-port="0" /> + <edge from-layer="4938" from-port="2" to-layer="4940" to-port="0" /> + <edge from-layer="4939" from-port="2" to-layer="4949" to-port="0" /> + <edge from-layer="4940" from-port="1" to-layer="4943" to-port="0" /> + <edge from-layer="4940" from-port="1" to-layer="4947" to-port="0" /> + <edge from-layer="4941" from-port="0" to-layer="4943" to-port="1" /> + <edge from-layer="4942" from-port="0" to-layer="4943" to-port="2" /> + <edge from-layer="4943" from-port="3" to-layer="4948" to-port="1" /> + <edge from-layer="4944" from-port="0" to-layer="4948" to-port="2" /> + <edge from-layer="4945" from-port="0" to-layer="4947" to-port="1" /> + <edge from-layer="4946" from-port="0" to-layer="4947" to-port="2" /> + <edge from-layer="4947" from-port="3" to-layer="4948" to-port="3" /> + <edge from-layer="4948" from-port="4" to-layer="4949" to-port="1" /> + <edge from-layer="4949" from-port="2" to-layer="4951" to-port="0" /> + <edge from-layer="4950" from-port="0" to-layer="4951" to-port="1" /> + <edge from-layer="4951" from-port="2" to-layer="4965" to-port="2" /> + <edge from-layer="4952" from-port="0" to-layer="4964" to-port="1" /> + <edge from-layer="4953" from-port="1" to-layer="4956" to-port="0" /> + <edge from-layer="4954" from-port="0" to-layer="4956" to-port="1" /> + <edge from-layer="4955" from-port="0" to-layer="4956" to-port="2" /> + <edge from-layer="4956" from-port="3" to-layer="4961" to-port="0" /> + <edge from-layer="4957" from-port="1" to-layer="4960" to-port="0" /> + <edge from-layer="4958" from-port="0" to-layer="4960" to-port="1" /> + <edge from-layer="4959" from-port="0" to-layer="4960" to-port="2" /> + <edge from-layer="4960" from-port="3" to-layer="4961" to-port="1" /> + <edge from-layer="4961" from-port="2" to-layer="4964" to-port="2" /> + <edge from-layer="4962" from-port="0" to-layer="4964" to-port="3" /> + <edge from-layer="4963" from-port="0" to-layer="4964" to-port="4" /> + <edge from-layer="4964" from-port="5" to-layer="4965" to-port="3" /> + <edge from-layer="4965" from-port="4" to-layer="4967" to-port="0" /> + <edge from-layer="4966" from-port="0" to-layer="4967" to-port="1" /> + <edge from-layer="4967" from-port="2" to-layer="4969" to-port="0" /> + <edge from-layer="4968" from-port="0" to-layer="4969" to-port="1" /> + <edge from-layer="4969" from-port="2" to-layer="4980" to-port="0" /> + <edge from-layer="4970" from-port="0" to-layer="4971" to-port="0" /> + <edge from-layer="4971" from-port="1" to-layer="4974" to-port="0" /> + <edge from-layer="4972" from-port="0" to-layer="4973" to-port="0" /> + <edge from-layer="4973" from-port="1" to-layer="4974" to-port="1" /> + <edge from-layer="4974" from-port="2" to-layer="4976" to-port="0" /> + <edge from-layer="4975" from-port="0" to-layer="4976" to-port="1" /> + <edge from-layer="4976" from-port="2" to-layer="4978" to-port="0" /> + <edge from-layer="4977" from-port="0" to-layer="4978" to-port="1" /> + <edge from-layer="4978" from-port="2" to-layer="4979" to-port="0" /> + <edge from-layer="4979" from-port="1" to-layer="4980" to-port="1" /> + <edge from-layer="4980" from-port="2" to-layer="4981" to-port="1" /> + <edge from-layer="4981" from-port="2" to-layer="4992" to-port="0" /> + <edge from-layer="4981" from-port="2" to-layer="5029" to-port="0" /> + <edge from-layer="4981" from-port="2" to-layer="4985" to-port="0" /> + <edge from-layer="4982" from-port="0" to-layer="4993" to-port="0" /> + <edge from-layer="4983" from-port="0" to-layer="4991" to-port="0" /> + <edge from-layer="4984" from-port="0" to-layer="4985" to-port="1" /> + <edge from-layer="4985" from-port="2" to-layer="4987" to-port="0" /> + <edge from-layer="4986" from-port="0" to-layer="4987" to-port="1" /> + <edge from-layer="4987" from-port="2" to-layer="4989" to-port="0" /> + <edge from-layer="4988" from-port="0" to-layer="4989" to-port="1" /> + <edge from-layer="4989" from-port="2" to-layer="4990" to-port="0" /> + <edge from-layer="4990" from-port="1" to-layer="4991" to-port="1" /> + <edge from-layer="4991" from-port="2" to-layer="4992" to-port="1" /> + <edge from-layer="4992" from-port="2" to-layer="4993" to-port="1" /> + <edge from-layer="4993" from-port="2" to-layer="5016" to-port="0" /> + <edge from-layer="4993" from-port="2" to-layer="5004" to-port="0" /> + <edge from-layer="4994" from-port="0" to-layer="4995" to-port="0" /> + <edge from-layer="4995" from-port="1" to-layer="4998" to-port="0" /> + <edge from-layer="4996" from-port="0" to-layer="4997" to-port="0" /> + <edge from-layer="4997" from-port="1" to-layer="4998" to-port="1" /> + <edge from-layer="4998" from-port="2" to-layer="5000" to-port="0" /> + <edge from-layer="4999" from-port="0" to-layer="5000" to-port="1" /> + <edge from-layer="5000" from-port="2" to-layer="5002" to-port="0" /> + <edge from-layer="5001" from-port="0" to-layer="5002" to-port="1" /> + <edge from-layer="5002" from-port="2" to-layer="5003" to-port="0" /> + <edge from-layer="5003" from-port="1" to-layer="5004" to-port="1" /> + <edge from-layer="5004" from-port="2" to-layer="5005" to-port="0" /> + <edge from-layer="5005" from-port="1" to-layer="5017" to-port="0" /> + <edge from-layer="5006" from-port="0" to-layer="5007" to-port="0" /> + <edge from-layer="5007" from-port="1" to-layer="5010" to-port="0" /> + <edge from-layer="5008" from-port="0" to-layer="5009" to-port="0" /> + <edge from-layer="5009" from-port="1" to-layer="5010" to-port="1" /> + <edge from-layer="5010" from-port="2" to-layer="5012" to-port="0" /> + <edge from-layer="5011" from-port="0" to-layer="5012" to-port="1" /> + <edge from-layer="5012" from-port="2" to-layer="5014" to-port="0" /> + <edge from-layer="5013" from-port="0" to-layer="5014" to-port="1" /> + <edge from-layer="5014" from-port="2" to-layer="5015" to-port="0" /> + <edge from-layer="5015" from-port="1" to-layer="5016" to-port="1" /> + <edge from-layer="5016" from-port="2" to-layer="5017" to-port="1" /> + <edge from-layer="5017" from-port="2" to-layer="5028" to-port="0" /> + <edge from-layer="5018" from-port="0" to-layer="5019" to-port="0" /> + <edge from-layer="5019" from-port="1" to-layer="5022" to-port="0" /> + <edge from-layer="5020" from-port="0" to-layer="5021" to-port="0" /> + <edge from-layer="5021" from-port="1" to-layer="5022" to-port="1" /> + <edge from-layer="5022" from-port="2" to-layer="5024" to-port="0" /> + <edge from-layer="5023" from-port="0" to-layer="5024" to-port="1" /> + <edge from-layer="5024" from-port="2" to-layer="5026" to-port="0" /> + <edge from-layer="5025" from-port="0" to-layer="5026" to-port="1" /> + <edge from-layer="5026" from-port="2" to-layer="5027" to-port="0" /> + <edge from-layer="5027" from-port="1" to-layer="5028" to-port="1" /> + <edge from-layer="5028" from-port="2" to-layer="5029" to-port="1" /> + <edge from-layer="5029" from-port="2" to-layer="5213" to-port="0" /> + <edge from-layer="5029" from-port="2" to-layer="5040" to-port="0" /> + <edge from-layer="5029" from-port="2" to-layer="5033" to-port="0" /> + <edge from-layer="5030" from-port="0" to-layer="5041" to-port="0" /> + <edge from-layer="5031" from-port="0" to-layer="5039" to-port="0" /> + <edge from-layer="5032" from-port="0" to-layer="5033" to-port="1" /> + <edge from-layer="5033" from-port="2" to-layer="5035" to-port="0" /> + <edge from-layer="5034" from-port="0" to-layer="5035" to-port="1" /> + <edge from-layer="5035" from-port="2" to-layer="5037" to-port="0" /> + <edge from-layer="5036" from-port="0" to-layer="5037" to-port="1" /> + <edge from-layer="5037" from-port="2" to-layer="5038" to-port="0" /> + <edge from-layer="5038" from-port="1" to-layer="5039" to-port="1" /> + <edge from-layer="5039" from-port="2" to-layer="5040" to-port="1" /> + <edge from-layer="5040" from-port="2" to-layer="5041" to-port="1" /> + <edge from-layer="5041" from-port="2" to-layer="5052" to-port="0" /> + <edge from-layer="5041" from-port="2" to-layer="5100" to-port="0" /> + <edge from-layer="5041" from-port="2" to-layer="5162" to-port="0" /> + <edge from-layer="5042" from-port="0" to-layer="5043" to-port="0" /> + <edge from-layer="5043" from-port="1" to-layer="5046" to-port="0" /> + <edge from-layer="5044" from-port="0" to-layer="5045" to-port="0" /> + <edge from-layer="5045" from-port="1" to-layer="5046" to-port="1" /> + <edge from-layer="5046" from-port="2" to-layer="5048" to-port="0" /> + <edge from-layer="5047" from-port="0" to-layer="5048" to-port="1" /> + <edge from-layer="5048" from-port="2" to-layer="5050" to-port="0" /> + <edge from-layer="5049" from-port="0" to-layer="5050" to-port="1" /> + <edge from-layer="5050" from-port="2" to-layer="5051" to-port="0" /> + <edge from-layer="5051" from-port="1" to-layer="5052" to-port="1" /> + <edge from-layer="5052" from-port="2" to-layer="5055" to-port="0" /> + <edge from-layer="5053" from-port="0" to-layer="5054" to-port="0" /> + <edge from-layer="5054" from-port="1" to-layer="5055" to-port="1" /> + <edge from-layer="5055" from-port="2" to-layer="5057" to-port="0" /> + <edge from-layer="5056" from-port="0" to-layer="5057" to-port="1" /> + <edge from-layer="5057" from-port="2" to-layer="5059" to-port="0" /> + <edge from-layer="5058" from-port="0" to-layer="5059" to-port="1" /> + <edge from-layer="5059" from-port="2" to-layer="5060" to-port="0" /> + <edge from-layer="5059" from-port="2" to-layer="5061" to-port="0" /> + <edge from-layer="5059" from-port="2" to-layer="5071" to-port="0" /> + <edge from-layer="5059" from-port="2" to-layer="5077" to-port="0" /> + <edge from-layer="5060" from-port="2" to-layer="5080" to-port="0" /> + <edge from-layer="5061" from-port="1" to-layer="5063" to-port="0" /> + <edge from-layer="5062" from-port="0" to-layer="5063" to-port="2" /> + <edge from-layer="5063" from-port="3" to-layer="5064" to-port="0" /> + <edge from-layer="5064" from-port="2" to-layer="5065" to-port="0" /> + <edge from-layer="5065" from-port="1" to-layer="5067" to-port="0" /> + <edge from-layer="5066" from-port="0" to-layer="5067" to-port="1" /> + <edge from-layer="5067" from-port="2" to-layer="5071" to-port="1" /> + <edge from-layer="5067" from-port="2" to-layer="5077" to-port="2" /> + <edge from-layer="5068" from-port="0" to-layer="5071" to-port="2" /> + <edge from-layer="5069" from-port="0" to-layer="5071" to-port="3" /> + <edge from-layer="5070" from-port="0" to-layer="5071" to-port="4" /> + <edge from-layer="5071" from-port="5" to-layer="5073" to-port="0" /> + <edge from-layer="5072" from-port="0" to-layer="5073" to-port="1" /> + <edge from-layer="5073" from-port="2" to-layer="5078" to-port="0" /> + <edge from-layer="5074" from-port="0" to-layer="5077" to-port="1" /> + <edge from-layer="5075" from-port="0" to-layer="5077" to-port="3" /> + <edge from-layer="5076" from-port="0" to-layer="5077" to-port="4" /> + <edge from-layer="5077" from-port="5" to-layer="5078" to-port="1" /> + <edge from-layer="5078" from-port="2" to-layer="5079" to-port="0" /> + <edge from-layer="5079" from-port="2" to-layer="5080" to-port="1" /> + <edge from-layer="5080" from-port="2" to-layer="5197" to-port="0" /> + <edge from-layer="5081" from-port="0" to-layer="5086" to-port="0" /> + <edge from-layer="5082" from-port="0" to-layer="5085" to-port="1" /> + <edge from-layer="5083" from-port="0" to-layer="5085" to-port="2" /> + <edge from-layer="5084" from-port="0" to-layer="5085" to-port="3" /> + <edge from-layer="5085" from-port="4" to-layer="5086" to-port="1" /> + <edge from-layer="5086" from-port="2" to-layer="5087" to-port="0" /> + <edge from-layer="5087" from-port="1" to-layer="5089" to-port="0" /> + <edge from-layer="5088" from-port="0" to-layer="5089" to-port="2" /> + <edge from-layer="5089" from-port="3" to-layer="5185" to-port="0" /> + <edge from-layer="5089" from-port="3" to-layer="5129" to-port="0" /> + <edge from-layer="5090" from-port="0" to-layer="5091" to-port="0" /> + <edge from-layer="5091" from-port="1" to-layer="5094" to-port="0" /> + <edge from-layer="5092" from-port="0" to-layer="5093" to-port="0" /> + <edge from-layer="5093" from-port="1" to-layer="5094" to-port="1" /> + <edge from-layer="5094" from-port="2" to-layer="5096" to-port="0" /> + <edge from-layer="5095" from-port="0" to-layer="5096" to-port="1" /> + <edge from-layer="5096" from-port="2" to-layer="5098" to-port="0" /> + <edge from-layer="5097" from-port="0" to-layer="5098" to-port="1" /> + <edge from-layer="5098" from-port="2" to-layer="5099" to-port="0" /> + <edge from-layer="5099" from-port="1" to-layer="5100" to-port="1" /> + <edge from-layer="5100" from-port="2" to-layer="5103" to-port="0" /> + <edge from-layer="5101" from-port="0" to-layer="5102" to-port="0" /> + <edge from-layer="5102" from-port="1" to-layer="5103" to-port="1" /> + <edge from-layer="5103" from-port="2" to-layer="5105" to-port="0" /> + <edge from-layer="5104" from-port="0" to-layer="5105" to-port="1" /> + <edge from-layer="5105" from-port="2" to-layer="5107" to-port="0" /> + <edge from-layer="5106" from-port="0" to-layer="5107" to-port="1" /> + <edge from-layer="5107" from-port="2" to-layer="5108" to-port="0" /> + <edge from-layer="5107" from-port="2" to-layer="5109" to-port="0" /> + <edge from-layer="5107" from-port="2" to-layer="5125" to-port="0" /> + <edge from-layer="5107" from-port="2" to-layer="5119" to-port="0" /> + <edge from-layer="5108" from-port="2" to-layer="5128" to-port="0" /> + <edge from-layer="5109" from-port="1" to-layer="5111" to-port="0" /> + <edge from-layer="5110" from-port="0" to-layer="5111" to-port="2" /> + <edge from-layer="5111" from-port="3" to-layer="5112" to-port="0" /> + <edge from-layer="5112" from-port="2" to-layer="5113" to-port="0" /> + <edge from-layer="5113" from-port="1" to-layer="5115" to-port="0" /> + <edge from-layer="5114" from-port="0" to-layer="5115" to-port="1" /> + <edge from-layer="5115" from-port="2" to-layer="5119" to-port="1" /> + <edge from-layer="5115" from-port="2" to-layer="5125" to-port="2" /> + <edge from-layer="5116" from-port="0" to-layer="5119" to-port="2" /> + <edge from-layer="5117" from-port="0" to-layer="5119" to-port="3" /> + <edge from-layer="5118" from-port="0" to-layer="5119" to-port="4" /> + <edge from-layer="5119" from-port="5" to-layer="5121" to-port="0" /> + <edge from-layer="5120" from-port="0" to-layer="5121" to-port="1" /> + <edge from-layer="5121" from-port="2" to-layer="5126" to-port="0" /> + <edge from-layer="5122" from-port="0" to-layer="5125" to-port="1" /> + <edge from-layer="5123" from-port="0" to-layer="5125" to-port="3" /> + <edge from-layer="5124" from-port="0" to-layer="5125" to-port="4" /> + <edge from-layer="5125" from-port="5" to-layer="5126" to-port="1" /> + <edge from-layer="5126" from-port="2" to-layer="5127" to-port="0" /> + <edge from-layer="5127" from-port="2" to-layer="5128" to-port="1" /> + <edge from-layer="5128" from-port="2" to-layer="5129" to-port="1" /> + <edge from-layer="5128" from-port="2" to-layer="5189" to-port="0" /> + <edge from-layer="5129" from-port="2" to-layer="5131" to-port="0" /> + <edge from-layer="5129" from-port="2" to-layer="11198" to-port="0" /> + <edge from-layer="5129" from-port="2" to-layer="5130" to-port="0" /> + <edge from-layer="5130" from-port="2" to-layer="5140" to-port="0" /> + <edge from-layer="5131" from-port="1" to-layer="5134" to-port="0" /> + <edge from-layer="5131" from-port="1" to-layer="5138" to-port="0" /> + <edge from-layer="5132" from-port="0" to-layer="5134" to-port="1" /> + <edge from-layer="5133" from-port="0" to-layer="5134" to-port="2" /> + <edge from-layer="5134" from-port="3" to-layer="5139" to-port="0" /> + <edge from-layer="5135" from-port="0" to-layer="5139" to-port="1" /> + <edge from-layer="5136" from-port="0" to-layer="5138" to-port="1" /> + <edge from-layer="5137" from-port="0" to-layer="5138" to-port="2" /> + <edge from-layer="5138" from-port="3" to-layer="5139" to-port="2" /> + <edge from-layer="5139" from-port="3" to-layer="5140" to-port="1" /> + <edge from-layer="5140" from-port="2" to-layer="5142" to-port="0" /> + <edge from-layer="5141" from-port="0" to-layer="5142" to-port="1" /> + <edge from-layer="5142" from-port="2" to-layer="5197" to-port="1" /> + <edge from-layer="5143" from-port="0" to-layer="5148" to-port="0" /> + <edge from-layer="5144" from-port="0" to-layer="5147" to-port="1" /> + <edge from-layer="5145" from-port="0" to-layer="5147" to-port="2" /> + <edge from-layer="5146" from-port="0" to-layer="5147" to-port="3" /> + <edge from-layer="5147" from-port="4" to-layer="5148" to-port="1" /> + <edge from-layer="5148" from-port="2" to-layer="5149" to-port="0" /> + <edge from-layer="5149" from-port="1" to-layer="5151" to-port="0" /> + <edge from-layer="5150" from-port="0" to-layer="5151" to-port="2" /> + <edge from-layer="5151" from-port="3" to-layer="5170" to-port="0" /> + <edge from-layer="5152" from-port="0" to-layer="5153" to-port="0" /> + <edge from-layer="5153" from-port="1" to-layer="5156" to-port="0" /> + <edge from-layer="5154" from-port="0" to-layer="5155" to-port="0" /> + <edge from-layer="5155" from-port="1" to-layer="5156" to-port="1" /> + <edge from-layer="5156" from-port="2" to-layer="5158" to-port="0" /> + <edge from-layer="5157" from-port="0" to-layer="5158" to-port="1" /> + <edge from-layer="5158" from-port="2" to-layer="5160" to-port="0" /> + <edge from-layer="5159" from-port="0" to-layer="5160" to-port="1" /> + <edge from-layer="5160" from-port="2" to-layer="5161" to-port="0" /> + <edge from-layer="5161" from-port="1" to-layer="5162" to-port="1" /> + <edge from-layer="5162" from-port="2" to-layer="5165" to-port="0" /> + <edge from-layer="5163" from-port="0" to-layer="5164" to-port="0" /> + <edge from-layer="5164" from-port="1" to-layer="5165" to-port="1" /> + <edge from-layer="5165" from-port="2" to-layer="5167" to-port="0" /> + <edge from-layer="5166" from-port="0" to-layer="5167" to-port="1" /> + <edge from-layer="5167" from-port="2" to-layer="5169" to-port="0" /> + <edge from-layer="5168" from-port="0" to-layer="5169" to-port="1" /> + <edge from-layer="5169" from-port="2" to-layer="5170" to-port="1" /> + <edge from-layer="5170" from-port="2" to-layer="5171" to-port="0" /> + <edge from-layer="5170" from-port="2" to-layer="5172" to-port="0" /> + <edge from-layer="5170" from-port="2" to-layer="11197" to-port="0" /> + <edge from-layer="5171" from-port="2" to-layer="5181" to-port="0" /> + <edge from-layer="5172" from-port="1" to-layer="5179" to-port="0" /> + <edge from-layer="5172" from-port="1" to-layer="5175" to-port="0" /> + <edge from-layer="5173" from-port="0" to-layer="5175" to-port="1" /> + <edge from-layer="5174" from-port="0" to-layer="5175" to-port="2" /> + <edge from-layer="5175" from-port="3" to-layer="5180" to-port="1" /> + <edge from-layer="5176" from-port="0" to-layer="5180" to-port="2" /> + <edge from-layer="5177" from-port="0" to-layer="5179" to-port="1" /> + <edge from-layer="5178" from-port="0" to-layer="5179" to-port="2" /> + <edge from-layer="5179" from-port="3" to-layer="5180" to-port="3" /> + <edge from-layer="5180" from-port="4" to-layer="5181" to-port="1" /> + <edge from-layer="5181" from-port="2" to-layer="5183" to-port="0" /> + <edge from-layer="5182" from-port="0" to-layer="5183" to-port="1" /> + <edge from-layer="5183" from-port="2" to-layer="5197" to-port="2" /> + <edge from-layer="5184" from-port="0" to-layer="5196" to-port="1" /> + <edge from-layer="5185" from-port="1" to-layer="5188" to-port="0" /> + <edge from-layer="5186" from-port="0" to-layer="5188" to-port="1" /> + <edge from-layer="5187" from-port="0" to-layer="5188" to-port="2" /> + <edge from-layer="5188" from-port="3" to-layer="5193" to-port="0" /> + <edge from-layer="5189" from-port="1" to-layer="5192" to-port="0" /> + <edge from-layer="5190" from-port="0" to-layer="5192" to-port="1" /> + <edge from-layer="5191" from-port="0" to-layer="5192" to-port="2" /> + <edge from-layer="5192" from-port="3" to-layer="5193" to-port="1" /> + <edge from-layer="5193" from-port="2" to-layer="5196" to-port="2" /> + <edge from-layer="5194" from-port="0" to-layer="5196" to-port="3" /> + <edge from-layer="5195" from-port="0" to-layer="5196" to-port="4" /> + <edge from-layer="5196" from-port="5" to-layer="5197" to-port="3" /> + <edge from-layer="5197" from-port="4" to-layer="5199" to-port="0" /> + <edge from-layer="5198" from-port="0" to-layer="5199" to-port="1" /> + <edge from-layer="5199" from-port="2" to-layer="5201" to-port="0" /> + <edge from-layer="5200" from-port="0" to-layer="5201" to-port="1" /> + <edge from-layer="5201" from-port="2" to-layer="5212" to-port="0" /> + <edge from-layer="5202" from-port="0" to-layer="5203" to-port="0" /> + <edge from-layer="5203" from-port="1" to-layer="5206" to-port="0" /> + <edge from-layer="5204" from-port="0" to-layer="5205" to-port="0" /> + <edge from-layer="5205" from-port="1" to-layer="5206" to-port="1" /> + <edge from-layer="5206" from-port="2" to-layer="5208" to-port="0" /> + <edge from-layer="5207" from-port="0" to-layer="5208" to-port="1" /> + <edge from-layer="5208" from-port="2" to-layer="5210" to-port="0" /> + <edge from-layer="5209" from-port="0" to-layer="5210" to-port="1" /> + <edge from-layer="5210" from-port="2" to-layer="5211" to-port="0" /> + <edge from-layer="5211" from-port="1" to-layer="5212" to-port="1" /> + <edge from-layer="5212" from-port="2" to-layer="5213" to-port="1" /> + <edge from-layer="5213" from-port="2" to-layer="5224" to-port="0" /> + <edge from-layer="5213" from-port="2" to-layer="5261" to-port="0" /> + <edge from-layer="5213" from-port="2" to-layer="5217" to-port="0" /> + <edge from-layer="5214" from-port="0" to-layer="5225" to-port="0" /> + <edge from-layer="5215" from-port="0" to-layer="5223" to-port="0" /> + <edge from-layer="5216" from-port="0" to-layer="5217" to-port="1" /> + <edge from-layer="5217" from-port="2" to-layer="5219" to-port="0" /> + <edge from-layer="5218" from-port="0" to-layer="5219" to-port="1" /> + <edge from-layer="5219" from-port="2" to-layer="5221" to-port="0" /> + <edge from-layer="5220" from-port="0" to-layer="5221" to-port="1" /> + <edge from-layer="5221" from-port="2" to-layer="5222" to-port="0" /> + <edge from-layer="5222" from-port="1" to-layer="5223" to-port="1" /> + <edge from-layer="5223" from-port="2" to-layer="5224" to-port="1" /> + <edge from-layer="5224" from-port="2" to-layer="5225" to-port="1" /> + <edge from-layer="5225" from-port="2" to-layer="5236" to-port="0" /> + <edge from-layer="5225" from-port="2" to-layer="5248" to-port="0" /> + <edge from-layer="5226" from-port="0" to-layer="5227" to-port="0" /> + <edge from-layer="5227" from-port="1" to-layer="5230" to-port="0" /> + <edge from-layer="5228" from-port="0" to-layer="5229" to-port="0" /> + <edge from-layer="5229" from-port="1" to-layer="5230" to-port="1" /> + <edge from-layer="5230" from-port="2" to-layer="5232" to-port="0" /> + <edge from-layer="5231" from-port="0" to-layer="5232" to-port="1" /> + <edge from-layer="5232" from-port="2" to-layer="5234" to-port="0" /> + <edge from-layer="5233" from-port="0" to-layer="5234" to-port="1" /> + <edge from-layer="5234" from-port="2" to-layer="5235" to-port="0" /> + <edge from-layer="5235" from-port="1" to-layer="5236" to-port="1" /> + <edge from-layer="5236" from-port="2" to-layer="5237" to-port="0" /> + <edge from-layer="5237" from-port="1" to-layer="5249" to-port="0" /> + <edge from-layer="5238" from-port="0" to-layer="5239" to-port="0" /> + <edge from-layer="5239" from-port="1" to-layer="5242" to-port="0" /> + <edge from-layer="5240" from-port="0" to-layer="5241" to-port="0" /> + <edge from-layer="5241" from-port="1" to-layer="5242" to-port="1" /> + <edge from-layer="5242" from-port="2" to-layer="5244" to-port="0" /> + <edge from-layer="5243" from-port="0" to-layer="5244" to-port="1" /> + <edge from-layer="5244" from-port="2" to-layer="5246" to-port="0" /> + <edge from-layer="5245" from-port="0" to-layer="5246" to-port="1" /> + <edge from-layer="5246" from-port="2" to-layer="5247" to-port="0" /> + <edge from-layer="5247" from-port="1" to-layer="5248" to-port="1" /> + <edge from-layer="5248" from-port="2" to-layer="5249" to-port="1" /> + <edge from-layer="5249" from-port="2" to-layer="5260" to-port="0" /> + <edge from-layer="5250" from-port="0" to-layer="5251" to-port="0" /> + <edge from-layer="5251" from-port="1" to-layer="5254" to-port="0" /> + <edge from-layer="5252" from-port="0" to-layer="5253" to-port="0" /> + <edge from-layer="5253" from-port="1" to-layer="5254" to-port="1" /> + <edge from-layer="5254" from-port="2" to-layer="5256" to-port="0" /> + <edge from-layer="5255" from-port="0" to-layer="5256" to-port="1" /> + <edge from-layer="5256" from-port="2" to-layer="5258" to-port="0" /> + <edge from-layer="5257" from-port="0" to-layer="5258" to-port="1" /> + <edge from-layer="5258" from-port="2" to-layer="5259" to-port="0" /> + <edge from-layer="5259" from-port="1" to-layer="5260" to-port="1" /> + <edge from-layer="5260" from-port="2" to-layer="5261" to-port="1" /> + <edge from-layer="5261" from-port="2" to-layer="5272" to-port="0" /> + <edge from-layer="5261" from-port="2" to-layer="5445" to-port="0" /> + <edge from-layer="5261" from-port="2" to-layer="5265" to-port="0" /> + <edge from-layer="5262" from-port="0" to-layer="5273" to-port="0" /> + <edge from-layer="5263" from-port="0" to-layer="5271" to-port="0" /> + <edge from-layer="5264" from-port="0" to-layer="5265" to-port="1" /> + <edge from-layer="5265" from-port="2" to-layer="5267" to-port="0" /> + <edge from-layer="5266" from-port="0" to-layer="5267" to-port="1" /> + <edge from-layer="5267" from-port="2" to-layer="5269" to-port="0" /> + <edge from-layer="5268" from-port="0" to-layer="5269" to-port="1" /> + <edge from-layer="5269" from-port="2" to-layer="5270" to-port="0" /> + <edge from-layer="5270" from-port="1" to-layer="5271" to-port="1" /> + <edge from-layer="5271" from-port="2" to-layer="5272" to-port="1" /> + <edge from-layer="5272" from-port="2" to-layer="5273" to-port="1" /> + <edge from-layer="5273" from-port="2" to-layer="5332" to-port="0" /> + <edge from-layer="5273" from-port="2" to-layer="5284" to-port="0" /> + <edge from-layer="5273" from-port="2" to-layer="5394" to-port="0" /> + <edge from-layer="5274" from-port="0" to-layer="5275" to-port="0" /> + <edge from-layer="5275" from-port="1" to-layer="5278" to-port="0" /> + <edge from-layer="5276" from-port="0" to-layer="5277" to-port="0" /> + <edge from-layer="5277" from-port="1" to-layer="5278" to-port="1" /> + <edge from-layer="5278" from-port="2" to-layer="5280" to-port="0" /> + <edge from-layer="5279" from-port="0" to-layer="5280" to-port="1" /> + <edge from-layer="5280" from-port="2" to-layer="5282" to-port="0" /> + <edge from-layer="5281" from-port="0" to-layer="5282" to-port="1" /> + <edge from-layer="5282" from-port="2" to-layer="5283" to-port="0" /> + <edge from-layer="5283" from-port="1" to-layer="5284" to-port="1" /> + <edge from-layer="5284" from-port="2" to-layer="5287" to-port="0" /> + <edge from-layer="5285" from-port="0" to-layer="5286" to-port="0" /> + <edge from-layer="5286" from-port="1" to-layer="5287" to-port="1" /> + <edge from-layer="5287" from-port="2" to-layer="5289" to-port="0" /> + <edge from-layer="5288" from-port="0" to-layer="5289" to-port="1" /> + <edge from-layer="5289" from-port="2" to-layer="5291" to-port="0" /> + <edge from-layer="5290" from-port="0" to-layer="5291" to-port="1" /> + <edge from-layer="5291" from-port="2" to-layer="5292" to-port="0" /> + <edge from-layer="5291" from-port="2" to-layer="5293" to-port="0" /> + <edge from-layer="5291" from-port="2" to-layer="5309" to-port="0" /> + <edge from-layer="5291" from-port="2" to-layer="5303" to-port="0" /> + <edge from-layer="5292" from-port="2" to-layer="5312" to-port="0" /> + <edge from-layer="5293" from-port="1" to-layer="5295" to-port="0" /> + <edge from-layer="5294" from-port="0" to-layer="5295" to-port="2" /> + <edge from-layer="5295" from-port="3" to-layer="5296" to-port="0" /> + <edge from-layer="5296" from-port="2" to-layer="5297" to-port="0" /> + <edge from-layer="5297" from-port="1" to-layer="5299" to-port="0" /> + <edge from-layer="5298" from-port="0" to-layer="5299" to-port="1" /> + <edge from-layer="5299" from-port="2" to-layer="5309" to-port="2" /> + <edge from-layer="5299" from-port="2" to-layer="5303" to-port="1" /> + <edge from-layer="5300" from-port="0" to-layer="5303" to-port="2" /> + <edge from-layer="5301" from-port="0" to-layer="5303" to-port="3" /> + <edge from-layer="5302" from-port="0" to-layer="5303" to-port="4" /> + <edge from-layer="5303" from-port="5" to-layer="5305" to-port="0" /> + <edge from-layer="5304" from-port="0" to-layer="5305" to-port="1" /> + <edge from-layer="5305" from-port="2" to-layer="5310" to-port="0" /> + <edge from-layer="5306" from-port="0" to-layer="5309" to-port="1" /> + <edge from-layer="5307" from-port="0" to-layer="5309" to-port="3" /> + <edge from-layer="5308" from-port="0" to-layer="5309" to-port="4" /> + <edge from-layer="5309" from-port="5" to-layer="5310" to-port="1" /> + <edge from-layer="5310" from-port="2" to-layer="5311" to-port="0" /> + <edge from-layer="5311" from-port="2" to-layer="5312" to-port="1" /> + <edge from-layer="5312" from-port="2" to-layer="5429" to-port="0" /> + <edge from-layer="5313" from-port="0" to-layer="5318" to-port="0" /> + <edge from-layer="5314" from-port="0" to-layer="5317" to-port="1" /> + <edge from-layer="5315" from-port="0" to-layer="5317" to-port="2" /> + <edge from-layer="5316" from-port="0" to-layer="5317" to-port="3" /> + <edge from-layer="5317" from-port="4" to-layer="5318" to-port="1" /> + <edge from-layer="5318" from-port="2" to-layer="5319" to-port="0" /> + <edge from-layer="5319" from-port="1" to-layer="5321" to-port="0" /> + <edge from-layer="5320" from-port="0" to-layer="5321" to-port="2" /> + <edge from-layer="5321" from-port="3" to-layer="5361" to-port="0" /> + <edge from-layer="5321" from-port="3" to-layer="5417" to-port="0" /> + <edge from-layer="5322" from-port="0" to-layer="5323" to-port="0" /> + <edge from-layer="5323" from-port="1" to-layer="5326" to-port="0" /> + <edge from-layer="5324" from-port="0" to-layer="5325" to-port="0" /> + <edge from-layer="5325" from-port="1" to-layer="5326" to-port="1" /> + <edge from-layer="5326" from-port="2" to-layer="5328" to-port="0" /> + <edge from-layer="5327" from-port="0" to-layer="5328" to-port="1" /> + <edge from-layer="5328" from-port="2" to-layer="5330" to-port="0" /> + <edge from-layer="5329" from-port="0" to-layer="5330" to-port="1" /> + <edge from-layer="5330" from-port="2" to-layer="5331" to-port="0" /> + <edge from-layer="5331" from-port="1" to-layer="5332" to-port="1" /> + <edge from-layer="5332" from-port="2" to-layer="5335" to-port="0" /> + <edge from-layer="5333" from-port="0" to-layer="5334" to-port="0" /> + <edge from-layer="5334" from-port="1" to-layer="5335" to-port="1" /> + <edge from-layer="5335" from-port="2" to-layer="5337" to-port="0" /> + <edge from-layer="5336" from-port="0" to-layer="5337" to-port="1" /> + <edge from-layer="5337" from-port="2" to-layer="5339" to-port="0" /> + <edge from-layer="5338" from-port="0" to-layer="5339" to-port="1" /> + <edge from-layer="5339" from-port="2" to-layer="5351" to-port="0" /> + <edge from-layer="5339" from-port="2" to-layer="5357" to-port="0" /> + <edge from-layer="5339" from-port="2" to-layer="5341" to-port="0" /> + <edge from-layer="5339" from-port="2" to-layer="5340" to-port="0" /> + <edge from-layer="5340" from-port="2" to-layer="5360" to-port="0" /> + <edge from-layer="5341" from-port="1" to-layer="5343" to-port="0" /> + <edge from-layer="5342" from-port="0" to-layer="5343" to-port="2" /> + <edge from-layer="5343" from-port="3" to-layer="5344" to-port="0" /> + <edge from-layer="5344" from-port="2" to-layer="5345" to-port="0" /> + <edge from-layer="5345" from-port="1" to-layer="5347" to-port="0" /> + <edge from-layer="5346" from-port="0" to-layer="5347" to-port="1" /> + <edge from-layer="5347" from-port="2" to-layer="5351" to-port="1" /> + <edge from-layer="5347" from-port="2" to-layer="5357" to-port="2" /> + <edge from-layer="5348" from-port="0" to-layer="5351" to-port="2" /> + <edge from-layer="5349" from-port="0" to-layer="5351" to-port="3" /> + <edge from-layer="5350" from-port="0" to-layer="5351" to-port="4" /> + <edge from-layer="5351" from-port="5" to-layer="5353" to-port="0" /> + <edge from-layer="5352" from-port="0" to-layer="5353" to-port="1" /> + <edge from-layer="5353" from-port="2" to-layer="5358" to-port="0" /> + <edge from-layer="5354" from-port="0" to-layer="5357" to-port="1" /> + <edge from-layer="5355" from-port="0" to-layer="5357" to-port="3" /> + <edge from-layer="5356" from-port="0" to-layer="5357" to-port="4" /> + <edge from-layer="5357" from-port="5" to-layer="5358" to-port="1" /> + <edge from-layer="5358" from-port="2" to-layer="5359" to-port="0" /> + <edge from-layer="5359" from-port="2" to-layer="5360" to-port="1" /> + <edge from-layer="5360" from-port="2" to-layer="5421" to-port="0" /> + <edge from-layer="5360" from-port="2" to-layer="5361" to-port="1" /> + <edge from-layer="5361" from-port="2" to-layer="11196" to-port="0" /> + <edge from-layer="5361" from-port="2" to-layer="5362" to-port="0" /> + <edge from-layer="5361" from-port="2" to-layer="5363" to-port="0" /> + <edge from-layer="5362" from-port="2" to-layer="5372" to-port="0" /> + <edge from-layer="5363" from-port="1" to-layer="5366" to-port="0" /> + <edge from-layer="5363" from-port="1" to-layer="5370" to-port="0" /> + <edge from-layer="5364" from-port="0" to-layer="5366" to-port="1" /> + <edge from-layer="5365" from-port="0" to-layer="5366" to-port="2" /> + <edge from-layer="5366" from-port="3" to-layer="5371" to-port="0" /> + <edge from-layer="5367" from-port="0" to-layer="5371" to-port="1" /> + <edge from-layer="5368" from-port="0" to-layer="5370" to-port="1" /> + <edge from-layer="5369" from-port="0" to-layer="5370" to-port="2" /> + <edge from-layer="5370" from-port="3" to-layer="5371" to-port="2" /> + <edge from-layer="5371" from-port="3" to-layer="5372" to-port="1" /> + <edge from-layer="5372" from-port="2" to-layer="5374" to-port="0" /> + <edge from-layer="5373" from-port="0" to-layer="5374" to-port="1" /> + <edge from-layer="5374" from-port="2" to-layer="5429" to-port="1" /> + <edge from-layer="5375" from-port="0" to-layer="5380" to-port="0" /> + <edge from-layer="5376" from-port="0" to-layer="5379" to-port="1" /> + <edge from-layer="5377" from-port="0" to-layer="5379" to-port="2" /> + <edge from-layer="5378" from-port="0" to-layer="5379" to-port="3" /> + <edge from-layer="5379" from-port="4" to-layer="5380" to-port="1" /> + <edge from-layer="5380" from-port="2" to-layer="5381" to-port="0" /> + <edge from-layer="5381" from-port="1" to-layer="5383" to-port="0" /> + <edge from-layer="5382" from-port="0" to-layer="5383" to-port="2" /> + <edge from-layer="5383" from-port="3" to-layer="5402" to-port="0" /> + <edge from-layer="5384" from-port="0" to-layer="5385" to-port="0" /> + <edge from-layer="5385" from-port="1" to-layer="5388" to-port="0" /> + <edge from-layer="5386" from-port="0" to-layer="5387" to-port="0" /> + <edge from-layer="5387" from-port="1" to-layer="5388" to-port="1" /> + <edge from-layer="5388" from-port="2" to-layer="5390" to-port="0" /> + <edge from-layer="5389" from-port="0" to-layer="5390" to-port="1" /> + <edge from-layer="5390" from-port="2" to-layer="5392" to-port="0" /> + <edge from-layer="5391" from-port="0" to-layer="5392" to-port="1" /> + <edge from-layer="5392" from-port="2" to-layer="5393" to-port="0" /> + <edge from-layer="5393" from-port="1" to-layer="5394" to-port="1" /> + <edge from-layer="5394" from-port="2" to-layer="5397" to-port="0" /> + <edge from-layer="5395" from-port="0" to-layer="5396" to-port="0" /> + <edge from-layer="5396" from-port="1" to-layer="5397" to-port="1" /> + <edge from-layer="5397" from-port="2" to-layer="5399" to-port="0" /> + <edge from-layer="5398" from-port="0" to-layer="5399" to-port="1" /> + <edge from-layer="5399" from-port="2" to-layer="5401" to-port="0" /> + <edge from-layer="5400" from-port="0" to-layer="5401" to-port="1" /> + <edge from-layer="5401" from-port="2" to-layer="5402" to-port="1" /> + <edge from-layer="5402" from-port="2" to-layer="11195" to-port="0" /> + <edge from-layer="5402" from-port="2" to-layer="5403" to-port="0" /> + <edge from-layer="5402" from-port="2" to-layer="5404" to-port="0" /> + <edge from-layer="5403" from-port="2" to-layer="5413" to-port="0" /> + <edge from-layer="5404" from-port="1" to-layer="5407" to-port="0" /> + <edge from-layer="5404" from-port="1" to-layer="5411" to-port="0" /> + <edge from-layer="5405" from-port="0" to-layer="5407" to-port="1" /> + <edge from-layer="5406" from-port="0" to-layer="5407" to-port="2" /> + <edge from-layer="5407" from-port="3" to-layer="5412" to-port="1" /> + <edge from-layer="5408" from-port="0" to-layer="5412" to-port="2" /> + <edge from-layer="5409" from-port="0" to-layer="5411" to-port="1" /> + <edge from-layer="5410" from-port="0" to-layer="5411" to-port="2" /> + <edge from-layer="5411" from-port="3" to-layer="5412" to-port="3" /> + <edge from-layer="5412" from-port="4" to-layer="5413" to-port="1" /> + <edge from-layer="5413" from-port="2" to-layer="5415" to-port="0" /> + <edge from-layer="5414" from-port="0" to-layer="5415" to-port="1" /> + <edge from-layer="5415" from-port="2" to-layer="5429" to-port="2" /> + <edge from-layer="5416" from-port="0" to-layer="5428" to-port="1" /> + <edge from-layer="5417" from-port="1" to-layer="5420" to-port="0" /> + <edge from-layer="5418" from-port="0" to-layer="5420" to-port="1" /> + <edge from-layer="5419" from-port="0" to-layer="5420" to-port="2" /> + <edge from-layer="5420" from-port="3" to-layer="5425" to-port="0" /> + <edge from-layer="5421" from-port="1" to-layer="5424" to-port="0" /> + <edge from-layer="5422" from-port="0" to-layer="5424" to-port="1" /> + <edge from-layer="5423" from-port="0" to-layer="5424" to-port="2" /> + <edge from-layer="5424" from-port="3" to-layer="5425" to-port="1" /> + <edge from-layer="5425" from-port="2" to-layer="5428" to-port="2" /> + <edge from-layer="5426" from-port="0" to-layer="5428" to-port="3" /> + <edge from-layer="5427" from-port="0" to-layer="5428" to-port="4" /> + <edge from-layer="5428" from-port="5" to-layer="5429" to-port="3" /> + <edge from-layer="5429" from-port="4" to-layer="5431" to-port="0" /> + <edge from-layer="5430" from-port="0" to-layer="5431" to-port="1" /> + <edge from-layer="5431" from-port="2" to-layer="5433" to-port="0" /> + <edge from-layer="5432" from-port="0" to-layer="5433" to-port="1" /> + <edge from-layer="5433" from-port="2" to-layer="5444" to-port="0" /> + <edge from-layer="5434" from-port="0" to-layer="5435" to-port="0" /> + <edge from-layer="5435" from-port="1" to-layer="5438" to-port="0" /> + <edge from-layer="5436" from-port="0" to-layer="5437" to-port="0" /> + <edge from-layer="5437" from-port="1" to-layer="5438" to-port="1" /> + <edge from-layer="5438" from-port="2" to-layer="5440" to-port="0" /> + <edge from-layer="5439" from-port="0" to-layer="5440" to-port="1" /> + <edge from-layer="5440" from-port="2" to-layer="5442" to-port="0" /> + <edge from-layer="5441" from-port="0" to-layer="5442" to-port="1" /> + <edge from-layer="5442" from-port="2" to-layer="5443" to-port="0" /> + <edge from-layer="5443" from-port="1" to-layer="5444" to-port="1" /> + <edge from-layer="5444" from-port="2" to-layer="5445" to-port="1" /> + <edge from-layer="5445" from-port="2" to-layer="5456" to-port="0" /> + <edge from-layer="5445" from-port="2" to-layer="5449" to-port="0" /> + <edge from-layer="5445" from-port="2" to-layer="5493" to-port="0" /> + <edge from-layer="5446" from-port="0" to-layer="5457" to-port="0" /> + <edge from-layer="5447" from-port="0" to-layer="5455" to-port="0" /> + <edge from-layer="5448" from-port="0" to-layer="5449" to-port="1" /> + <edge from-layer="5449" from-port="2" to-layer="5451" to-port="0" /> + <edge from-layer="5450" from-port="0" to-layer="5451" to-port="1" /> + <edge from-layer="5451" from-port="2" to-layer="5453" to-port="0" /> + <edge from-layer="5452" from-port="0" to-layer="5453" to-port="1" /> + <edge from-layer="5453" from-port="2" to-layer="5454" to-port="0" /> + <edge from-layer="5454" from-port="1" to-layer="5455" to-port="1" /> + <edge from-layer="5455" from-port="2" to-layer="5456" to-port="1" /> + <edge from-layer="5456" from-port="2" to-layer="5457" to-port="1" /> + <edge from-layer="5457" from-port="2" to-layer="5468" to-port="0" /> + <edge from-layer="5457" from-port="2" to-layer="5480" to-port="0" /> + <edge from-layer="5458" from-port="0" to-layer="5459" to-port="0" /> + <edge from-layer="5459" from-port="1" to-layer="5462" to-port="0" /> + <edge from-layer="5460" from-port="0" to-layer="5461" to-port="0" /> + <edge from-layer="5461" from-port="1" to-layer="5462" to-port="1" /> + <edge from-layer="5462" from-port="2" to-layer="5464" to-port="0" /> + <edge from-layer="5463" from-port="0" to-layer="5464" to-port="1" /> + <edge from-layer="5464" from-port="2" to-layer="5466" to-port="0" /> + <edge from-layer="5465" from-port="0" to-layer="5466" to-port="1" /> + <edge from-layer="5466" from-port="2" to-layer="5467" to-port="0" /> + <edge from-layer="5467" from-port="1" to-layer="5468" to-port="1" /> + <edge from-layer="5468" from-port="2" to-layer="5469" to-port="0" /> + <edge from-layer="5469" from-port="1" to-layer="5481" to-port="0" /> + <edge from-layer="5470" from-port="0" to-layer="5471" to-port="0" /> + <edge from-layer="5471" from-port="1" to-layer="5474" to-port="0" /> + <edge from-layer="5472" from-port="0" to-layer="5473" to-port="0" /> + <edge from-layer="5473" from-port="1" to-layer="5474" to-port="1" /> + <edge from-layer="5474" from-port="2" to-layer="5476" to-port="0" /> + <edge from-layer="5475" from-port="0" to-layer="5476" to-port="1" /> + <edge from-layer="5476" from-port="2" to-layer="5478" to-port="0" /> + <edge from-layer="5477" from-port="0" to-layer="5478" to-port="1" /> + <edge from-layer="5478" from-port="2" to-layer="5479" to-port="0" /> + <edge from-layer="5479" from-port="1" to-layer="5480" to-port="1" /> + <edge from-layer="5480" from-port="2" to-layer="5481" to-port="1" /> + <edge from-layer="5481" from-port="2" to-layer="5492" to-port="0" /> + <edge from-layer="5482" from-port="0" to-layer="5483" to-port="0" /> + <edge from-layer="5483" from-port="1" to-layer="5486" to-port="0" /> + <edge from-layer="5484" from-port="0" to-layer="5485" to-port="0" /> + <edge from-layer="5485" from-port="1" to-layer="5486" to-port="1" /> + <edge from-layer="5486" from-port="2" to-layer="5488" to-port="0" /> + <edge from-layer="5487" from-port="0" to-layer="5488" to-port="1" /> + <edge from-layer="5488" from-port="2" to-layer="5490" to-port="0" /> + <edge from-layer="5489" from-port="0" to-layer="5490" to-port="1" /> + <edge from-layer="5490" from-port="2" to-layer="5491" to-port="0" /> + <edge from-layer="5491" from-port="1" to-layer="5492" to-port="1" /> + <edge from-layer="5492" from-port="2" to-layer="5493" to-port="1" /> + <edge from-layer="5493" from-port="2" to-layer="5677" to-port="0" /> + <edge from-layer="5493" from-port="2" to-layer="5504" to-port="0" /> + <edge from-layer="5493" from-port="2" to-layer="5497" to-port="0" /> + <edge from-layer="5494" from-port="0" to-layer="5505" to-port="0" /> + <edge from-layer="5495" from-port="0" to-layer="5503" to-port="0" /> + <edge from-layer="5496" from-port="0" to-layer="5497" to-port="1" /> + <edge from-layer="5497" from-port="2" to-layer="5499" to-port="0" /> + <edge from-layer="5498" from-port="0" to-layer="5499" to-port="1" /> + <edge from-layer="5499" from-port="2" to-layer="5501" to-port="0" /> + <edge from-layer="5500" from-port="0" to-layer="5501" to-port="1" /> + <edge from-layer="5501" from-port="2" to-layer="5502" to-port="0" /> + <edge from-layer="5502" from-port="1" to-layer="5503" to-port="1" /> + <edge from-layer="5503" from-port="2" to-layer="5504" to-port="1" /> + <edge from-layer="5504" from-port="2" to-layer="5505" to-port="1" /> + <edge from-layer="5505" from-port="2" to-layer="5516" to-port="0" /> + <edge from-layer="5505" from-port="2" to-layer="5626" to-port="0" /> + <edge from-layer="5505" from-port="2" to-layer="5564" to-port="0" /> + <edge from-layer="5506" from-port="0" to-layer="5507" to-port="0" /> + <edge from-layer="5507" from-port="1" to-layer="5510" to-port="0" /> + <edge from-layer="5508" from-port="0" to-layer="5509" to-port="0" /> + <edge from-layer="5509" from-port="1" to-layer="5510" to-port="1" /> + <edge from-layer="5510" from-port="2" to-layer="5512" to-port="0" /> + <edge from-layer="5511" from-port="0" to-layer="5512" to-port="1" /> + <edge from-layer="5512" from-port="2" to-layer="5514" to-port="0" /> + <edge from-layer="5513" from-port="0" to-layer="5514" to-port="1" /> + <edge from-layer="5514" from-port="2" to-layer="5515" to-port="0" /> + <edge from-layer="5515" from-port="1" to-layer="5516" to-port="1" /> + <edge from-layer="5516" from-port="2" to-layer="5519" to-port="0" /> + <edge from-layer="5517" from-port="0" to-layer="5518" to-port="0" /> + <edge from-layer="5518" from-port="1" to-layer="5519" to-port="1" /> + <edge from-layer="5519" from-port="2" to-layer="5521" to-port="0" /> + <edge from-layer="5520" from-port="0" to-layer="5521" to-port="1" /> + <edge from-layer="5521" from-port="2" to-layer="5523" to-port="0" /> + <edge from-layer="5522" from-port="0" to-layer="5523" to-port="1" /> + <edge from-layer="5523" from-port="2" to-layer="5524" to-port="0" /> + <edge from-layer="5523" from-port="2" to-layer="5525" to-port="0" /> + <edge from-layer="5523" from-port="2" to-layer="5535" to-port="0" /> + <edge from-layer="5523" from-port="2" to-layer="5541" to-port="0" /> + <edge from-layer="5524" from-port="2" to-layer="5544" to-port="0" /> + <edge from-layer="5525" from-port="1" to-layer="5527" to-port="0" /> + <edge from-layer="5526" from-port="0" to-layer="5527" to-port="2" /> + <edge from-layer="5527" from-port="3" to-layer="5528" to-port="0" /> + <edge from-layer="5528" from-port="2" to-layer="5529" to-port="0" /> + <edge from-layer="5529" from-port="1" to-layer="5531" to-port="0" /> + <edge from-layer="5530" from-port="0" to-layer="5531" to-port="1" /> + <edge from-layer="5531" from-port="2" to-layer="5535" to-port="1" /> + <edge from-layer="5531" from-port="2" to-layer="5541" to-port="2" /> + <edge from-layer="5532" from-port="0" to-layer="5535" to-port="2" /> + <edge from-layer="5533" from-port="0" to-layer="5535" to-port="3" /> + <edge from-layer="5534" from-port="0" to-layer="5535" to-port="4" /> + <edge from-layer="5535" from-port="5" to-layer="5537" to-port="0" /> + <edge from-layer="5536" from-port="0" to-layer="5537" to-port="1" /> + <edge from-layer="5537" from-port="2" to-layer="5542" to-port="0" /> + <edge from-layer="5538" from-port="0" to-layer="5541" to-port="1" /> + <edge from-layer="5539" from-port="0" to-layer="5541" to-port="3" /> + <edge from-layer="5540" from-port="0" to-layer="5541" to-port="4" /> + <edge from-layer="5541" from-port="5" to-layer="5542" to-port="1" /> + <edge from-layer="5542" from-port="2" to-layer="5543" to-port="0" /> + <edge from-layer="5543" from-port="2" to-layer="5544" to-port="1" /> + <edge from-layer="5544" from-port="2" to-layer="5661" to-port="0" /> + <edge from-layer="5545" from-port="0" to-layer="5550" to-port="0" /> + <edge from-layer="5546" from-port="0" to-layer="5549" to-port="1" /> + <edge from-layer="5547" from-port="0" to-layer="5549" to-port="2" /> + <edge from-layer="5548" from-port="0" to-layer="5549" to-port="3" /> + <edge from-layer="5549" from-port="4" to-layer="5550" to-port="1" /> + <edge from-layer="5550" from-port="2" to-layer="5551" to-port="0" /> + <edge from-layer="5551" from-port="1" to-layer="5553" to-port="0" /> + <edge from-layer="5552" from-port="0" to-layer="5553" to-port="2" /> + <edge from-layer="5553" from-port="3" to-layer="5649" to-port="0" /> + <edge from-layer="5553" from-port="3" to-layer="5593" to-port="0" /> + <edge from-layer="5554" from-port="0" to-layer="5555" to-port="0" /> + <edge from-layer="5555" from-port="1" to-layer="5558" to-port="0" /> + <edge from-layer="5556" from-port="0" to-layer="5557" to-port="0" /> + <edge from-layer="5557" from-port="1" to-layer="5558" to-port="1" /> + <edge from-layer="5558" from-port="2" to-layer="5560" to-port="0" /> + <edge from-layer="5559" from-port="0" to-layer="5560" to-port="1" /> + <edge from-layer="5560" from-port="2" to-layer="5562" to-port="0" /> + <edge from-layer="5561" from-port="0" to-layer="5562" to-port="1" /> + <edge from-layer="5562" from-port="2" to-layer="5563" to-port="0" /> + <edge from-layer="5563" from-port="1" to-layer="5564" to-port="1" /> + <edge from-layer="5564" from-port="2" to-layer="5567" to-port="0" /> + <edge from-layer="5565" from-port="0" to-layer="5566" to-port="0" /> + <edge from-layer="5566" from-port="1" to-layer="5567" to-port="1" /> + <edge from-layer="5567" from-port="2" to-layer="5569" to-port="0" /> + <edge from-layer="5568" from-port="0" to-layer="5569" to-port="1" /> + <edge from-layer="5569" from-port="2" to-layer="5571" to-port="0" /> + <edge from-layer="5570" from-port="0" to-layer="5571" to-port="1" /> + <edge from-layer="5571" from-port="2" to-layer="5589" to-port="0" /> + <edge from-layer="5571" from-port="2" to-layer="5583" to-port="0" /> + <edge from-layer="5571" from-port="2" to-layer="5573" to-port="0" /> + <edge from-layer="5571" from-port="2" to-layer="5572" to-port="0" /> + <edge from-layer="5572" from-port="2" to-layer="5592" to-port="0" /> + <edge from-layer="5573" from-port="1" to-layer="5575" to-port="0" /> + <edge from-layer="5574" from-port="0" to-layer="5575" to-port="2" /> + <edge from-layer="5575" from-port="3" to-layer="5576" to-port="0" /> + <edge from-layer="5576" from-port="2" to-layer="5577" to-port="0" /> + <edge from-layer="5577" from-port="1" to-layer="5579" to-port="0" /> + <edge from-layer="5578" from-port="0" to-layer="5579" to-port="1" /> + <edge from-layer="5579" from-port="2" to-layer="5589" to-port="2" /> + <edge from-layer="5579" from-port="2" to-layer="5583" to-port="1" /> + <edge from-layer="5580" from-port="0" to-layer="5583" to-port="2" /> + <edge from-layer="5581" from-port="0" to-layer="5583" to-port="3" /> + <edge from-layer="5582" from-port="0" to-layer="5583" to-port="4" /> + <edge from-layer="5583" from-port="5" to-layer="5585" to-port="0" /> + <edge from-layer="5584" from-port="0" to-layer="5585" to-port="1" /> + <edge from-layer="5585" from-port="2" to-layer="5590" to-port="0" /> + <edge from-layer="5586" from-port="0" to-layer="5589" to-port="1" /> + <edge from-layer="5587" from-port="0" to-layer="5589" to-port="3" /> + <edge from-layer="5588" from-port="0" to-layer="5589" to-port="4" /> + <edge from-layer="5589" from-port="5" to-layer="5590" to-port="1" /> + <edge from-layer="5590" from-port="2" to-layer="5591" to-port="0" /> + <edge from-layer="5591" from-port="2" to-layer="5592" to-port="1" /> + <edge from-layer="5592" from-port="2" to-layer="5593" to-port="1" /> + <edge from-layer="5592" from-port="2" to-layer="5653" to-port="0" /> + <edge from-layer="5593" from-port="2" to-layer="11194" to-port="0" /> + <edge from-layer="5593" from-port="2" to-layer="5595" to-port="0" /> + <edge from-layer="5593" from-port="2" to-layer="5594" to-port="0" /> + <edge from-layer="5594" from-port="2" to-layer="5604" to-port="0" /> + <edge from-layer="5595" from-port="1" to-layer="5598" to-port="0" /> + <edge from-layer="5595" from-port="1" to-layer="5602" to-port="0" /> + <edge from-layer="5596" from-port="0" to-layer="5598" to-port="1" /> + <edge from-layer="5597" from-port="0" to-layer="5598" to-port="2" /> + <edge from-layer="5598" from-port="3" to-layer="5603" to-port="0" /> + <edge from-layer="5599" from-port="0" to-layer="5603" to-port="1" /> + <edge from-layer="5600" from-port="0" to-layer="5602" to-port="1" /> + <edge from-layer="5601" from-port="0" to-layer="5602" to-port="2" /> + <edge from-layer="5602" from-port="3" to-layer="5603" to-port="2" /> + <edge from-layer="5603" from-port="3" to-layer="5604" to-port="1" /> + <edge from-layer="5604" from-port="2" to-layer="5606" to-port="0" /> + <edge from-layer="5605" from-port="0" to-layer="5606" to-port="1" /> + <edge from-layer="5606" from-port="2" to-layer="5661" to-port="1" /> + <edge from-layer="5607" from-port="0" to-layer="5612" to-port="0" /> + <edge from-layer="5608" from-port="0" to-layer="5611" to-port="1" /> + <edge from-layer="5609" from-port="0" to-layer="5611" to-port="2" /> + <edge from-layer="5610" from-port="0" to-layer="5611" to-port="3" /> + <edge from-layer="5611" from-port="4" to-layer="5612" to-port="1" /> + <edge from-layer="5612" from-port="2" to-layer="5613" to-port="0" /> + <edge from-layer="5613" from-port="1" to-layer="5615" to-port="0" /> + <edge from-layer="5614" from-port="0" to-layer="5615" to-port="2" /> + <edge from-layer="5615" from-port="3" to-layer="5634" to-port="0" /> + <edge from-layer="5616" from-port="0" to-layer="5617" to-port="0" /> + <edge from-layer="5617" from-port="1" to-layer="5620" to-port="0" /> + <edge from-layer="5618" from-port="0" to-layer="5619" to-port="0" /> + <edge from-layer="5619" from-port="1" to-layer="5620" to-port="1" /> + <edge from-layer="5620" from-port="2" to-layer="5622" to-port="0" /> + <edge from-layer="5621" from-port="0" to-layer="5622" to-port="1" /> + <edge from-layer="5622" from-port="2" to-layer="5624" to-port="0" /> + <edge from-layer="5623" from-port="0" to-layer="5624" to-port="1" /> + <edge from-layer="5624" from-port="2" to-layer="5625" to-port="0" /> + <edge from-layer="5625" from-port="1" to-layer="5626" to-port="1" /> + <edge from-layer="5626" from-port="2" to-layer="5629" to-port="0" /> + <edge from-layer="5627" from-port="0" to-layer="5628" to-port="0" /> + <edge from-layer="5628" from-port="1" to-layer="5629" to-port="1" /> + <edge from-layer="5629" from-port="2" to-layer="5631" to-port="0" /> + <edge from-layer="5630" from-port="0" to-layer="5631" to-port="1" /> + <edge from-layer="5631" from-port="2" to-layer="5633" to-port="0" /> + <edge from-layer="5632" from-port="0" to-layer="5633" to-port="1" /> + <edge from-layer="5633" from-port="2" to-layer="5634" to-port="1" /> + <edge from-layer="5634" from-port="2" to-layer="5636" to-port="0" /> + <edge from-layer="5634" from-port="2" to-layer="5635" to-port="0" /> + <edge from-layer="5634" from-port="2" to-layer="11193" to-port="0" /> + <edge from-layer="5635" from-port="2" to-layer="5645" to-port="0" /> + <edge from-layer="5636" from-port="1" to-layer="5643" to-port="0" /> + <edge from-layer="5636" from-port="1" to-layer="5639" to-port="0" /> + <edge from-layer="5637" from-port="0" to-layer="5639" to-port="1" /> + <edge from-layer="5638" from-port="0" to-layer="5639" to-port="2" /> + <edge from-layer="5639" from-port="3" to-layer="5644" to-port="1" /> + <edge from-layer="5640" from-port="0" to-layer="5644" to-port="2" /> + <edge from-layer="5641" from-port="0" to-layer="5643" to-port="1" /> + <edge from-layer="5642" from-port="0" to-layer="5643" to-port="2" /> + <edge from-layer="5643" from-port="3" to-layer="5644" to-port="3" /> + <edge from-layer="5644" from-port="4" to-layer="5645" to-port="1" /> + <edge from-layer="5645" from-port="2" to-layer="5647" to-port="0" /> + <edge from-layer="5646" from-port="0" to-layer="5647" to-port="1" /> + <edge from-layer="5647" from-port="2" to-layer="5661" to-port="2" /> + <edge from-layer="5648" from-port="0" to-layer="5660" to-port="1" /> + <edge from-layer="5649" from-port="1" to-layer="5652" to-port="0" /> + <edge from-layer="5650" from-port="0" to-layer="5652" to-port="1" /> + <edge from-layer="5651" from-port="0" to-layer="5652" to-port="2" /> + <edge from-layer="5652" from-port="3" to-layer="5657" to-port="0" /> + <edge from-layer="5653" from-port="1" to-layer="5656" to-port="0" /> + <edge from-layer="5654" from-port="0" to-layer="5656" to-port="1" /> + <edge from-layer="5655" from-port="0" to-layer="5656" to-port="2" /> + <edge from-layer="5656" from-port="3" to-layer="5657" to-port="1" /> + <edge from-layer="5657" from-port="2" to-layer="5660" to-port="2" /> + <edge from-layer="5658" from-port="0" to-layer="5660" to-port="3" /> + <edge from-layer="5659" from-port="0" to-layer="5660" to-port="4" /> + <edge from-layer="5660" from-port="5" to-layer="5661" to-port="3" /> + <edge from-layer="5661" from-port="4" to-layer="5663" to-port="0" /> + <edge from-layer="5662" from-port="0" to-layer="5663" to-port="1" /> + <edge from-layer="5663" from-port="2" to-layer="5665" to-port="0" /> + <edge from-layer="5664" from-port="0" to-layer="5665" to-port="1" /> + <edge from-layer="5665" from-port="2" to-layer="5676" to-port="0" /> + <edge from-layer="5666" from-port="0" to-layer="5667" to-port="0" /> + <edge from-layer="5667" from-port="1" to-layer="5670" to-port="0" /> + <edge from-layer="5668" from-port="0" to-layer="5669" to-port="0" /> + <edge from-layer="5669" from-port="1" to-layer="5670" to-port="1" /> + <edge from-layer="5670" from-port="2" to-layer="5672" to-port="0" /> + <edge from-layer="5671" from-port="0" to-layer="5672" to-port="1" /> + <edge from-layer="5672" from-port="2" to-layer="5674" to-port="0" /> + <edge from-layer="5673" from-port="0" to-layer="5674" to-port="1" /> + <edge from-layer="5674" from-port="2" to-layer="5675" to-port="0" /> + <edge from-layer="5675" from-port="1" to-layer="5676" to-port="1" /> + <edge from-layer="5676" from-port="2" to-layer="5677" to-port="1" /> + <edge from-layer="5677" from-port="2" to-layer="5688" to-port="0" /> + <edge from-layer="5677" from-port="2" to-layer="5725" to-port="0" /> + <edge from-layer="5677" from-port="2" to-layer="5681" to-port="0" /> + <edge from-layer="5678" from-port="0" to-layer="5689" to-port="0" /> + <edge from-layer="5679" from-port="0" to-layer="5687" to-port="0" /> + <edge from-layer="5680" from-port="0" to-layer="5681" to-port="1" /> + <edge from-layer="5681" from-port="2" to-layer="5683" to-port="0" /> + <edge from-layer="5682" from-port="0" to-layer="5683" to-port="1" /> + <edge from-layer="5683" from-port="2" to-layer="5685" to-port="0" /> + <edge from-layer="5684" from-port="0" to-layer="5685" to-port="1" /> + <edge from-layer="5685" from-port="2" to-layer="5686" to-port="0" /> + <edge from-layer="5686" from-port="1" to-layer="5687" to-port="1" /> + <edge from-layer="5687" from-port="2" to-layer="5688" to-port="1" /> + <edge from-layer="5688" from-port="2" to-layer="5689" to-port="1" /> + <edge from-layer="5689" from-port="2" to-layer="5700" to-port="0" /> + <edge from-layer="5689" from-port="2" to-layer="5712" to-port="0" /> + <edge from-layer="5690" from-port="0" to-layer="5691" to-port="0" /> + <edge from-layer="5691" from-port="1" to-layer="5694" to-port="0" /> + <edge from-layer="5692" from-port="0" to-layer="5693" to-port="0" /> + <edge from-layer="5693" from-port="1" to-layer="5694" to-port="1" /> + <edge from-layer="5694" from-port="2" to-layer="5696" to-port="0" /> + <edge from-layer="5695" from-port="0" to-layer="5696" to-port="1" /> + <edge from-layer="5696" from-port="2" to-layer="5698" to-port="0" /> + <edge from-layer="5697" from-port="0" to-layer="5698" to-port="1" /> + <edge from-layer="5698" from-port="2" to-layer="5699" to-port="0" /> + <edge from-layer="5699" from-port="1" to-layer="5700" to-port="1" /> + <edge from-layer="5700" from-port="2" to-layer="5701" to-port="0" /> + <edge from-layer="5701" from-port="1" to-layer="5713" to-port="0" /> + <edge from-layer="5702" from-port="0" to-layer="5703" to-port="0" /> + <edge from-layer="5703" from-port="1" to-layer="5706" to-port="0" /> + <edge from-layer="5704" from-port="0" to-layer="5705" to-port="0" /> + <edge from-layer="5705" from-port="1" to-layer="5706" to-port="1" /> + <edge from-layer="5706" from-port="2" to-layer="5708" to-port="0" /> + <edge from-layer="5707" from-port="0" to-layer="5708" to-port="1" /> + <edge from-layer="5708" from-port="2" to-layer="5710" to-port="0" /> + <edge from-layer="5709" from-port="0" to-layer="5710" to-port="1" /> + <edge from-layer="5710" from-port="2" to-layer="5711" to-port="0" /> + <edge from-layer="5711" from-port="1" to-layer="5712" to-port="1" /> + <edge from-layer="5712" from-port="2" to-layer="5713" to-port="1" /> + <edge from-layer="5713" from-port="2" to-layer="5724" to-port="0" /> + <edge from-layer="5714" from-port="0" to-layer="5715" to-port="0" /> + <edge from-layer="5715" from-port="1" to-layer="5718" to-port="0" /> + <edge from-layer="5716" from-port="0" to-layer="5717" to-port="0" /> + <edge from-layer="5717" from-port="1" to-layer="5718" to-port="1" /> + <edge from-layer="5718" from-port="2" to-layer="5720" to-port="0" /> + <edge from-layer="5719" from-port="0" to-layer="5720" to-port="1" /> + <edge from-layer="5720" from-port="2" to-layer="5722" to-port="0" /> + <edge from-layer="5721" from-port="0" to-layer="5722" to-port="1" /> + <edge from-layer="5722" from-port="2" to-layer="5723" to-port="0" /> + <edge from-layer="5723" from-port="1" to-layer="5724" to-port="1" /> + <edge from-layer="5724" from-port="2" to-layer="5725" to-port="1" /> + <edge from-layer="5725" from-port="2" to-layer="5736" to-port="0" /> + <edge from-layer="5725" from-port="2" to-layer="5729" to-port="0" /> + <edge from-layer="5725" from-port="2" to-layer="5909" to-port="0" /> + <edge from-layer="5726" from-port="0" to-layer="5737" to-port="0" /> + <edge from-layer="5727" from-port="0" to-layer="5735" to-port="0" /> + <edge from-layer="5728" from-port="0" to-layer="5729" to-port="1" /> + <edge from-layer="5729" from-port="2" to-layer="5731" to-port="0" /> + <edge from-layer="5730" from-port="0" to-layer="5731" to-port="1" /> + <edge from-layer="5731" from-port="2" to-layer="5733" to-port="0" /> + <edge from-layer="5732" from-port="0" to-layer="5733" to-port="1" /> + <edge from-layer="5733" from-port="2" to-layer="5734" to-port="0" /> + <edge from-layer="5734" from-port="1" to-layer="5735" to-port="1" /> + <edge from-layer="5735" from-port="2" to-layer="5736" to-port="1" /> + <edge from-layer="5736" from-port="2" to-layer="5737" to-port="1" /> + <edge from-layer="5737" from-port="2" to-layer="5748" to-port="0" /> + <edge from-layer="5737" from-port="2" to-layer="5796" to-port="0" /> + <edge from-layer="5737" from-port="2" to-layer="5858" to-port="0" /> + <edge from-layer="5738" from-port="0" to-layer="5739" to-port="0" /> + <edge from-layer="5739" from-port="1" to-layer="5742" to-port="0" /> + <edge from-layer="5740" from-port="0" to-layer="5741" to-port="0" /> + <edge from-layer="5741" from-port="1" to-layer="5742" to-port="1" /> + <edge from-layer="5742" from-port="2" to-layer="5744" to-port="0" /> + <edge from-layer="5743" from-port="0" to-layer="5744" to-port="1" /> + <edge from-layer="5744" from-port="2" to-layer="5746" to-port="0" /> + <edge from-layer="5745" from-port="0" to-layer="5746" to-port="1" /> + <edge from-layer="5746" from-port="2" to-layer="5747" to-port="0" /> + <edge from-layer="5747" from-port="1" to-layer="5748" to-port="1" /> + <edge from-layer="5748" from-port="2" to-layer="5751" to-port="0" /> + <edge from-layer="5749" from-port="0" to-layer="5750" to-port="0" /> + <edge from-layer="5750" from-port="1" to-layer="5751" to-port="1" /> + <edge from-layer="5751" from-port="2" to-layer="5753" to-port="0" /> + <edge from-layer="5752" from-port="0" to-layer="5753" to-port="1" /> + <edge from-layer="5753" from-port="2" to-layer="5755" to-port="0" /> + <edge from-layer="5754" from-port="0" to-layer="5755" to-port="1" /> + <edge from-layer="5755" from-port="2" to-layer="5756" to-port="0" /> + <edge from-layer="5755" from-port="2" to-layer="5757" to-port="0" /> + <edge from-layer="5755" from-port="2" to-layer="5773" to-port="0" /> + <edge from-layer="5755" from-port="2" to-layer="5767" to-port="0" /> + <edge from-layer="5756" from-port="2" to-layer="5776" to-port="0" /> + <edge from-layer="5757" from-port="1" to-layer="5759" to-port="0" /> + <edge from-layer="5758" from-port="0" to-layer="5759" to-port="2" /> + <edge from-layer="5759" from-port="3" to-layer="5760" to-port="0" /> + <edge from-layer="5760" from-port="2" to-layer="5761" to-port="0" /> + <edge from-layer="5761" from-port="1" to-layer="5763" to-port="0" /> + <edge from-layer="5762" from-port="0" to-layer="5763" to-port="1" /> + <edge from-layer="5763" from-port="2" to-layer="5767" to-port="1" /> + <edge from-layer="5763" from-port="2" to-layer="5773" to-port="2" /> + <edge from-layer="5764" from-port="0" to-layer="5767" to-port="2" /> + <edge from-layer="5765" from-port="0" to-layer="5767" to-port="3" /> + <edge from-layer="5766" from-port="0" to-layer="5767" to-port="4" /> + <edge from-layer="5767" from-port="5" to-layer="5769" to-port="0" /> + <edge from-layer="5768" from-port="0" to-layer="5769" to-port="1" /> + <edge from-layer="5769" from-port="2" to-layer="5774" to-port="0" /> + <edge from-layer="5770" from-port="0" to-layer="5773" to-port="1" /> + <edge from-layer="5771" from-port="0" to-layer="5773" to-port="3" /> + <edge from-layer="5772" from-port="0" to-layer="5773" to-port="4" /> + <edge from-layer="5773" from-port="5" to-layer="5774" to-port="1" /> + <edge from-layer="5774" from-port="2" to-layer="5775" to-port="0" /> + <edge from-layer="5775" from-port="2" to-layer="5776" to-port="1" /> + <edge from-layer="5776" from-port="2" to-layer="5893" to-port="0" /> + <edge from-layer="5777" from-port="0" to-layer="5782" to-port="0" /> + <edge from-layer="5778" from-port="0" to-layer="5781" to-port="1" /> + <edge from-layer="5779" from-port="0" to-layer="5781" to-port="2" /> + <edge from-layer="5780" from-port="0" to-layer="5781" to-port="3" /> + <edge from-layer="5781" from-port="4" to-layer="5782" to-port="1" /> + <edge from-layer="5782" from-port="2" to-layer="5783" to-port="0" /> + <edge from-layer="5783" from-port="1" to-layer="5785" to-port="0" /> + <edge from-layer="5784" from-port="0" to-layer="5785" to-port="2" /> + <edge from-layer="5785" from-port="3" to-layer="5881" to-port="0" /> + <edge from-layer="5785" from-port="3" to-layer="5825" to-port="0" /> + <edge from-layer="5786" from-port="0" to-layer="5787" to-port="0" /> + <edge from-layer="5787" from-port="1" to-layer="5790" to-port="0" /> + <edge from-layer="5788" from-port="0" to-layer="5789" to-port="0" /> + <edge from-layer="5789" from-port="1" to-layer="5790" to-port="1" /> + <edge from-layer="5790" from-port="2" to-layer="5792" to-port="0" /> + <edge from-layer="5791" from-port="0" to-layer="5792" to-port="1" /> + <edge from-layer="5792" from-port="2" to-layer="5794" to-port="0" /> + <edge from-layer="5793" from-port="0" to-layer="5794" to-port="1" /> + <edge from-layer="5794" from-port="2" to-layer="5795" to-port="0" /> + <edge from-layer="5795" from-port="1" to-layer="5796" to-port="1" /> + <edge from-layer="5796" from-port="2" to-layer="5799" to-port="0" /> + <edge from-layer="5797" from-port="0" to-layer="5798" to-port="0" /> + <edge from-layer="5798" from-port="1" to-layer="5799" to-port="1" /> + <edge from-layer="5799" from-port="2" to-layer="5801" to-port="0" /> + <edge from-layer="5800" from-port="0" to-layer="5801" to-port="1" /> + <edge from-layer="5801" from-port="2" to-layer="5803" to-port="0" /> + <edge from-layer="5802" from-port="0" to-layer="5803" to-port="1" /> + <edge from-layer="5803" from-port="2" to-layer="5821" to-port="0" /> + <edge from-layer="5803" from-port="2" to-layer="5815" to-port="0" /> + <edge from-layer="5803" from-port="2" to-layer="5805" to-port="0" /> + <edge from-layer="5803" from-port="2" to-layer="5804" to-port="0" /> + <edge from-layer="5804" from-port="2" to-layer="5824" to-port="0" /> + <edge from-layer="5805" from-port="1" to-layer="5807" to-port="0" /> + <edge from-layer="5806" from-port="0" to-layer="5807" to-port="2" /> + <edge from-layer="5807" from-port="3" to-layer="5808" to-port="0" /> + <edge from-layer="5808" from-port="2" to-layer="5809" to-port="0" /> + <edge from-layer="5809" from-port="1" to-layer="5811" to-port="0" /> + <edge from-layer="5810" from-port="0" to-layer="5811" to-port="1" /> + <edge from-layer="5811" from-port="2" to-layer="5821" to-port="2" /> + <edge from-layer="5811" from-port="2" to-layer="5815" to-port="1" /> + <edge from-layer="5812" from-port="0" to-layer="5815" to-port="2" /> + <edge from-layer="5813" from-port="0" to-layer="5815" to-port="3" /> + <edge from-layer="5814" from-port="0" to-layer="5815" to-port="4" /> + <edge from-layer="5815" from-port="5" to-layer="5817" to-port="0" /> + <edge from-layer="5816" from-port="0" to-layer="5817" to-port="1" /> + <edge from-layer="5817" from-port="2" to-layer="5822" to-port="0" /> + <edge from-layer="5818" from-port="0" to-layer="5821" to-port="1" /> + <edge from-layer="5819" from-port="0" to-layer="5821" to-port="3" /> + <edge from-layer="5820" from-port="0" to-layer="5821" to-port="4" /> + <edge from-layer="5821" from-port="5" to-layer="5822" to-port="1" /> + <edge from-layer="5822" from-port="2" to-layer="5823" to-port="0" /> + <edge from-layer="5823" from-port="2" to-layer="5824" to-port="1" /> + <edge from-layer="5824" from-port="2" to-layer="5885" to-port="0" /> + <edge from-layer="5824" from-port="2" to-layer="5825" to-port="1" /> + <edge from-layer="5825" from-port="2" to-layer="11192" to-port="0" /> + <edge from-layer="5825" from-port="2" to-layer="5826" to-port="0" /> + <edge from-layer="5825" from-port="2" to-layer="5827" to-port="0" /> + <edge from-layer="5826" from-port="2" to-layer="5836" to-port="0" /> + <edge from-layer="5827" from-port="1" to-layer="5834" to-port="0" /> + <edge from-layer="5827" from-port="1" to-layer="5830" to-port="0" /> + <edge from-layer="5828" from-port="0" to-layer="5830" to-port="1" /> + <edge from-layer="5829" from-port="0" to-layer="5830" to-port="2" /> + <edge from-layer="5830" from-port="3" to-layer="5835" to-port="0" /> + <edge from-layer="5831" from-port="0" to-layer="5835" to-port="1" /> + <edge from-layer="5832" from-port="0" to-layer="5834" to-port="1" /> + <edge from-layer="5833" from-port="0" to-layer="5834" to-port="2" /> + <edge from-layer="5834" from-port="3" to-layer="5835" to-port="2" /> + <edge from-layer="5835" from-port="3" to-layer="5836" to-port="1" /> + <edge from-layer="5836" from-port="2" to-layer="5838" to-port="0" /> + <edge from-layer="5837" from-port="0" to-layer="5838" to-port="1" /> + <edge from-layer="5838" from-port="2" to-layer="5893" to-port="1" /> + <edge from-layer="5839" from-port="0" to-layer="5844" to-port="0" /> + <edge from-layer="5840" from-port="0" to-layer="5843" to-port="1" /> + <edge from-layer="5841" from-port="0" to-layer="5843" to-port="2" /> + <edge from-layer="5842" from-port="0" to-layer="5843" to-port="3" /> + <edge from-layer="5843" from-port="4" to-layer="5844" to-port="1" /> + <edge from-layer="5844" from-port="2" to-layer="5845" to-port="0" /> + <edge from-layer="5845" from-port="1" to-layer="5847" to-port="0" /> + <edge from-layer="5846" from-port="0" to-layer="5847" to-port="2" /> + <edge from-layer="5847" from-port="3" to-layer="5866" to-port="0" /> + <edge from-layer="5848" from-port="0" to-layer="5849" to-port="0" /> + <edge from-layer="5849" from-port="1" to-layer="5852" to-port="0" /> + <edge from-layer="5850" from-port="0" to-layer="5851" to-port="0" /> + <edge from-layer="5851" from-port="1" to-layer="5852" to-port="1" /> + <edge from-layer="5852" from-port="2" to-layer="5854" to-port="0" /> + <edge from-layer="5853" from-port="0" to-layer="5854" to-port="1" /> + <edge from-layer="5854" from-port="2" to-layer="5856" to-port="0" /> + <edge from-layer="5855" from-port="0" to-layer="5856" to-port="1" /> + <edge from-layer="5856" from-port="2" to-layer="5857" to-port="0" /> + <edge from-layer="5857" from-port="1" to-layer="5858" to-port="1" /> + <edge from-layer="5858" from-port="2" to-layer="5861" to-port="0" /> + <edge from-layer="5859" from-port="0" to-layer="5860" to-port="0" /> + <edge from-layer="5860" from-port="1" to-layer="5861" to-port="1" /> + <edge from-layer="5861" from-port="2" to-layer="5863" to-port="0" /> + <edge from-layer="5862" from-port="0" to-layer="5863" to-port="1" /> + <edge from-layer="5863" from-port="2" to-layer="5865" to-port="0" /> + <edge from-layer="5864" from-port="0" to-layer="5865" to-port="1" /> + <edge from-layer="5865" from-port="2" to-layer="5866" to-port="1" /> + <edge from-layer="5866" from-port="2" to-layer="11191" to-port="0" /> + <edge from-layer="5866" from-port="2" to-layer="5867" to-port="0" /> + <edge from-layer="5866" from-port="2" to-layer="5868" to-port="0" /> + <edge from-layer="5867" from-port="2" to-layer="5877" to-port="0" /> + <edge from-layer="5868" from-port="1" to-layer="5871" to-port="0" /> + <edge from-layer="5868" from-port="1" to-layer="5875" to-port="0" /> + <edge from-layer="5869" from-port="0" to-layer="5871" to-port="1" /> + <edge from-layer="5870" from-port="0" to-layer="5871" to-port="2" /> + <edge from-layer="5871" from-port="3" to-layer="5876" to-port="1" /> + <edge from-layer="5872" from-port="0" to-layer="5876" to-port="2" /> + <edge from-layer="5873" from-port="0" to-layer="5875" to-port="1" /> + <edge from-layer="5874" from-port="0" to-layer="5875" to-port="2" /> + <edge from-layer="5875" from-port="3" to-layer="5876" to-port="3" /> + <edge from-layer="5876" from-port="4" to-layer="5877" to-port="1" /> + <edge from-layer="5877" from-port="2" to-layer="5879" to-port="0" /> + <edge from-layer="5878" from-port="0" to-layer="5879" to-port="1" /> + <edge from-layer="5879" from-port="2" to-layer="5893" to-port="2" /> + <edge from-layer="5880" from-port="0" to-layer="5892" to-port="1" /> + <edge from-layer="5881" from-port="1" to-layer="5884" to-port="0" /> + <edge from-layer="5882" from-port="0" to-layer="5884" to-port="1" /> + <edge from-layer="5883" from-port="0" to-layer="5884" to-port="2" /> + <edge from-layer="5884" from-port="3" to-layer="5889" to-port="0" /> + <edge from-layer="5885" from-port="1" to-layer="5888" to-port="0" /> + <edge from-layer="5886" from-port="0" to-layer="5888" to-port="1" /> + <edge from-layer="5887" from-port="0" to-layer="5888" to-port="2" /> + <edge from-layer="5888" from-port="3" to-layer="5889" to-port="1" /> + <edge from-layer="5889" from-port="2" to-layer="5892" to-port="2" /> + <edge from-layer="5890" from-port="0" to-layer="5892" to-port="3" /> + <edge from-layer="5891" from-port="0" to-layer="5892" to-port="4" /> + <edge from-layer="5892" from-port="5" to-layer="5893" to-port="3" /> + <edge from-layer="5893" from-port="4" to-layer="5895" to-port="0" /> + <edge from-layer="5894" from-port="0" to-layer="5895" to-port="1" /> + <edge from-layer="5895" from-port="2" to-layer="5897" to-port="0" /> + <edge from-layer="5896" from-port="0" to-layer="5897" to-port="1" /> + <edge from-layer="5897" from-port="2" to-layer="5908" to-port="0" /> + <edge from-layer="5898" from-port="0" to-layer="5899" to-port="0" /> + <edge from-layer="5899" from-port="1" to-layer="5902" to-port="0" /> + <edge from-layer="5900" from-port="0" to-layer="5901" to-port="0" /> + <edge from-layer="5901" from-port="1" to-layer="5902" to-port="1" /> + <edge from-layer="5902" from-port="2" to-layer="5904" to-port="0" /> + <edge from-layer="5903" from-port="0" to-layer="5904" to-port="1" /> + <edge from-layer="5904" from-port="2" to-layer="5906" to-port="0" /> + <edge from-layer="5905" from-port="0" to-layer="5906" to-port="1" /> + <edge from-layer="5906" from-port="2" to-layer="5907" to-port="0" /> + <edge from-layer="5907" from-port="1" to-layer="5908" to-port="1" /> + <edge from-layer="5908" from-port="2" to-layer="5909" to-port="1" /> + <edge from-layer="5909" from-port="2" to-layer="5957" to-port="0" /> + <edge from-layer="5909" from-port="2" to-layer="5920" to-port="0" /> + <edge from-layer="5909" from-port="2" to-layer="5913" to-port="0" /> + <edge from-layer="5910" from-port="0" to-layer="5921" to-port="0" /> + <edge from-layer="5911" from-port="0" to-layer="5919" to-port="0" /> + <edge from-layer="5912" from-port="0" to-layer="5913" to-port="1" /> + <edge from-layer="5913" from-port="2" to-layer="5915" to-port="0" /> + <edge from-layer="5914" from-port="0" to-layer="5915" to-port="1" /> + <edge from-layer="5915" from-port="2" to-layer="5917" to-port="0" /> + <edge from-layer="5916" from-port="0" to-layer="5917" to-port="1" /> + <edge from-layer="5917" from-port="2" to-layer="5918" to-port="0" /> + <edge from-layer="5918" from-port="1" to-layer="5919" to-port="1" /> + <edge from-layer="5919" from-port="2" to-layer="5920" to-port="1" /> + <edge from-layer="5920" from-port="2" to-layer="5921" to-port="1" /> + <edge from-layer="5921" from-port="2" to-layer="5932" to-port="0" /> + <edge from-layer="5921" from-port="2" to-layer="5944" to-port="0" /> + <edge from-layer="5922" from-port="0" to-layer="5923" to-port="0" /> + <edge from-layer="5923" from-port="1" to-layer="5926" to-port="0" /> + <edge from-layer="5924" from-port="0" to-layer="5925" to-port="0" /> + <edge from-layer="5925" from-port="1" to-layer="5926" to-port="1" /> + <edge from-layer="5926" from-port="2" to-layer="5928" to-port="0" /> + <edge from-layer="5927" from-port="0" to-layer="5928" to-port="1" /> + <edge from-layer="5928" from-port="2" to-layer="5930" to-port="0" /> + <edge from-layer="5929" from-port="0" to-layer="5930" to-port="1" /> + <edge from-layer="5930" from-port="2" to-layer="5931" to-port="0" /> + <edge from-layer="5931" from-port="1" to-layer="5932" to-port="1" /> + <edge from-layer="5932" from-port="2" to-layer="5933" to-port="0" /> + <edge from-layer="5933" from-port="1" to-layer="5945" to-port="0" /> + <edge from-layer="5934" from-port="0" to-layer="5935" to-port="0" /> + <edge from-layer="5935" from-port="1" to-layer="5938" to-port="0" /> + <edge from-layer="5936" from-port="0" to-layer="5937" to-port="0" /> + <edge from-layer="5937" from-port="1" to-layer="5938" to-port="1" /> + <edge from-layer="5938" from-port="2" to-layer="5940" to-port="0" /> + <edge from-layer="5939" from-port="0" to-layer="5940" to-port="1" /> + <edge from-layer="5940" from-port="2" to-layer="5942" to-port="0" /> + <edge from-layer="5941" from-port="0" to-layer="5942" to-port="1" /> + <edge from-layer="5942" from-port="2" to-layer="5943" to-port="0" /> + <edge from-layer="5943" from-port="1" to-layer="5944" to-port="1" /> + <edge from-layer="5944" from-port="2" to-layer="5945" to-port="1" /> + <edge from-layer="5945" from-port="2" to-layer="5956" to-port="0" /> + <edge from-layer="5946" from-port="0" to-layer="5947" to-port="0" /> + <edge from-layer="5947" from-port="1" to-layer="5950" to-port="0" /> + <edge from-layer="5948" from-port="0" to-layer="5949" to-port="0" /> + <edge from-layer="5949" from-port="1" to-layer="5950" to-port="1" /> + <edge from-layer="5950" from-port="2" to-layer="5952" to-port="0" /> + <edge from-layer="5951" from-port="0" to-layer="5952" to-port="1" /> + <edge from-layer="5952" from-port="2" to-layer="5954" to-port="0" /> + <edge from-layer="5953" from-port="0" to-layer="5954" to-port="1" /> + <edge from-layer="5954" from-port="2" to-layer="5955" to-port="0" /> + <edge from-layer="5955" from-port="1" to-layer="5956" to-port="1" /> + <edge from-layer="5956" from-port="2" to-layer="5957" to-port="1" /> + <edge from-layer="5957" from-port="2" to-layer="6141" to-port="0" /> + <edge from-layer="5957" from-port="2" to-layer="5968" to-port="0" /> + <edge from-layer="5957" from-port="2" to-layer="5961" to-port="0" /> + <edge from-layer="5958" from-port="0" to-layer="5969" to-port="0" /> + <edge from-layer="5959" from-port="0" to-layer="5967" to-port="0" /> + <edge from-layer="5960" from-port="0" to-layer="5961" to-port="1" /> + <edge from-layer="5961" from-port="2" to-layer="5963" to-port="0" /> + <edge from-layer="5962" from-port="0" to-layer="5963" to-port="1" /> + <edge from-layer="5963" from-port="2" to-layer="5965" to-port="0" /> + <edge from-layer="5964" from-port="0" to-layer="5965" to-port="1" /> + <edge from-layer="5965" from-port="2" to-layer="5966" to-port="0" /> + <edge from-layer="5966" from-port="1" to-layer="5967" to-port="1" /> + <edge from-layer="5967" from-port="2" to-layer="5968" to-port="1" /> + <edge from-layer="5968" from-port="2" to-layer="5969" to-port="1" /> + <edge from-layer="5969" from-port="2" to-layer="6090" to-port="0" /> + <edge from-layer="5969" from-port="2" to-layer="6028" to-port="0" /> + <edge from-layer="5969" from-port="2" to-layer="5980" to-port="0" /> + <edge from-layer="5970" from-port="0" to-layer="5971" to-port="0" /> + <edge from-layer="5971" from-port="1" to-layer="5974" to-port="0" /> + <edge from-layer="5972" from-port="0" to-layer="5973" to-port="0" /> + <edge from-layer="5973" from-port="1" to-layer="5974" to-port="1" /> + <edge from-layer="5974" from-port="2" to-layer="5976" to-port="0" /> + <edge from-layer="5975" from-port="0" to-layer="5976" to-port="1" /> + <edge from-layer="5976" from-port="2" to-layer="5978" to-port="0" /> + <edge from-layer="5977" from-port="0" to-layer="5978" to-port="1" /> + <edge from-layer="5978" from-port="2" to-layer="5979" to-port="0" /> + <edge from-layer="5979" from-port="1" to-layer="5980" to-port="1" /> + <edge from-layer="5980" from-port="2" to-layer="5983" to-port="0" /> + <edge from-layer="5981" from-port="0" to-layer="5982" to-port="0" /> + <edge from-layer="5982" from-port="1" to-layer="5983" to-port="1" /> + <edge from-layer="5983" from-port="2" to-layer="5985" to-port="0" /> + <edge from-layer="5984" from-port="0" to-layer="5985" to-port="1" /> + <edge from-layer="5985" from-port="2" to-layer="5987" to-port="0" /> + <edge from-layer="5986" from-port="0" to-layer="5987" to-port="1" /> + <edge from-layer="5987" from-port="2" to-layer="6005" to-port="0" /> + <edge from-layer="5987" from-port="2" to-layer="5999" to-port="0" /> + <edge from-layer="5987" from-port="2" to-layer="5988" to-port="0" /> + <edge from-layer="5987" from-port="2" to-layer="5989" to-port="0" /> + <edge from-layer="5988" from-port="2" to-layer="6008" to-port="0" /> + <edge from-layer="5989" from-port="1" to-layer="5991" to-port="0" /> + <edge from-layer="5990" from-port="0" to-layer="5991" to-port="2" /> + <edge from-layer="5991" from-port="3" to-layer="5992" to-port="0" /> + <edge from-layer="5992" from-port="2" to-layer="5993" to-port="0" /> + <edge from-layer="5993" from-port="1" to-layer="5995" to-port="0" /> + <edge from-layer="5994" from-port="0" to-layer="5995" to-port="1" /> + <edge from-layer="5995" from-port="2" to-layer="6005" to-port="2" /> + <edge from-layer="5995" from-port="2" to-layer="5999" to-port="1" /> + <edge from-layer="5996" from-port="0" to-layer="5999" to-port="2" /> + <edge from-layer="5997" from-port="0" to-layer="5999" to-port="3" /> + <edge from-layer="5998" from-port="0" to-layer="5999" to-port="4" /> + <edge from-layer="5999" from-port="5" to-layer="6001" to-port="0" /> + <edge from-layer="6000" from-port="0" to-layer="6001" to-port="1" /> + <edge from-layer="6001" from-port="2" to-layer="6006" to-port="0" /> + <edge from-layer="6002" from-port="0" to-layer="6005" to-port="1" /> + <edge from-layer="6003" from-port="0" to-layer="6005" to-port="3" /> + <edge from-layer="6004" from-port="0" to-layer="6005" to-port="4" /> + <edge from-layer="6005" from-port="5" to-layer="6006" to-port="1" /> + <edge from-layer="6006" from-port="2" to-layer="6007" to-port="0" /> + <edge from-layer="6007" from-port="2" to-layer="6008" to-port="1" /> + <edge from-layer="6008" from-port="2" to-layer="6125" to-port="0" /> + <edge from-layer="6009" from-port="0" to-layer="6014" to-port="0" /> + <edge from-layer="6010" from-port="0" to-layer="6013" to-port="1" /> + <edge from-layer="6011" from-port="0" to-layer="6013" to-port="2" /> + <edge from-layer="6012" from-port="0" to-layer="6013" to-port="3" /> + <edge from-layer="6013" from-port="4" to-layer="6014" to-port="1" /> + <edge from-layer="6014" from-port="2" to-layer="6015" to-port="0" /> + <edge from-layer="6015" from-port="1" to-layer="6017" to-port="0" /> + <edge from-layer="6016" from-port="0" to-layer="6017" to-port="2" /> + <edge from-layer="6017" from-port="3" to-layer="6057" to-port="0" /> + <edge from-layer="6017" from-port="3" to-layer="6113" to-port="0" /> + <edge from-layer="6018" from-port="0" to-layer="6019" to-port="0" /> + <edge from-layer="6019" from-port="1" to-layer="6022" to-port="0" /> + <edge from-layer="6020" from-port="0" to-layer="6021" to-port="0" /> + <edge from-layer="6021" from-port="1" to-layer="6022" to-port="1" /> + <edge from-layer="6022" from-port="2" to-layer="6024" to-port="0" /> + <edge from-layer="6023" from-port="0" to-layer="6024" to-port="1" /> + <edge from-layer="6024" from-port="2" to-layer="6026" to-port="0" /> + <edge from-layer="6025" from-port="0" to-layer="6026" to-port="1" /> + <edge from-layer="6026" from-port="2" to-layer="6027" to-port="0" /> + <edge from-layer="6027" from-port="1" to-layer="6028" to-port="1" /> + <edge from-layer="6028" from-port="2" to-layer="6031" to-port="0" /> + <edge from-layer="6029" from-port="0" to-layer="6030" to-port="0" /> + <edge from-layer="6030" from-port="1" to-layer="6031" to-port="1" /> + <edge from-layer="6031" from-port="2" to-layer="6033" to-port="0" /> + <edge from-layer="6032" from-port="0" to-layer="6033" to-port="1" /> + <edge from-layer="6033" from-port="2" to-layer="6035" to-port="0" /> + <edge from-layer="6034" from-port="0" to-layer="6035" to-port="1" /> + <edge from-layer="6035" from-port="2" to-layer="6036" to-port="0" /> + <edge from-layer="6035" from-port="2" to-layer="6037" to-port="0" /> + <edge from-layer="6035" from-port="2" to-layer="6053" to-port="0" /> + <edge from-layer="6035" from-port="2" to-layer="6047" to-port="0" /> + <edge from-layer="6036" from-port="2" to-layer="6056" to-port="0" /> + <edge from-layer="6037" from-port="1" to-layer="6039" to-port="0" /> + <edge from-layer="6038" from-port="0" to-layer="6039" to-port="2" /> + <edge from-layer="6039" from-port="3" to-layer="6040" to-port="0" /> + <edge from-layer="6040" from-port="2" to-layer="6041" to-port="0" /> + <edge from-layer="6041" from-port="1" to-layer="6043" to-port="0" /> + <edge from-layer="6042" from-port="0" to-layer="6043" to-port="1" /> + <edge from-layer="6043" from-port="2" to-layer="6047" to-port="1" /> + <edge from-layer="6043" from-port="2" to-layer="6053" to-port="2" /> + <edge from-layer="6044" from-port="0" to-layer="6047" to-port="2" /> + <edge from-layer="6045" from-port="0" to-layer="6047" to-port="3" /> + <edge from-layer="6046" from-port="0" to-layer="6047" to-port="4" /> + <edge from-layer="6047" from-port="5" to-layer="6049" to-port="0" /> + <edge from-layer="6048" from-port="0" to-layer="6049" to-port="1" /> + <edge from-layer="6049" from-port="2" to-layer="6054" to-port="0" /> + <edge from-layer="6050" from-port="0" to-layer="6053" to-port="1" /> + <edge from-layer="6051" from-port="0" to-layer="6053" to-port="3" /> + <edge from-layer="6052" from-port="0" to-layer="6053" to-port="4" /> + <edge from-layer="6053" from-port="5" to-layer="6054" to-port="1" /> + <edge from-layer="6054" from-port="2" to-layer="6055" to-port="0" /> + <edge from-layer="6055" from-port="2" to-layer="6056" to-port="1" /> + <edge from-layer="6056" from-port="2" to-layer="6057" to-port="1" /> + <edge from-layer="6056" from-port="2" to-layer="6117" to-port="0" /> + <edge from-layer="6057" from-port="2" to-layer="6059" to-port="0" /> + <edge from-layer="6057" from-port="2" to-layer="11190" to-port="0" /> + <edge from-layer="6057" from-port="2" to-layer="6058" to-port="0" /> + <edge from-layer="6058" from-port="2" to-layer="6068" to-port="0" /> + <edge from-layer="6059" from-port="1" to-layer="6062" to-port="0" /> + <edge from-layer="6059" from-port="1" to-layer="6066" to-port="0" /> + <edge from-layer="6060" from-port="0" to-layer="6062" to-port="1" /> + <edge from-layer="6061" from-port="0" to-layer="6062" to-port="2" /> + <edge from-layer="6062" from-port="3" to-layer="6067" to-port="0" /> + <edge from-layer="6063" from-port="0" to-layer="6067" to-port="1" /> + <edge from-layer="6064" from-port="0" to-layer="6066" to-port="1" /> + <edge from-layer="6065" from-port="0" to-layer="6066" to-port="2" /> + <edge from-layer="6066" from-port="3" to-layer="6067" to-port="2" /> + <edge from-layer="6067" from-port="3" to-layer="6068" to-port="1" /> + <edge from-layer="6068" from-port="2" to-layer="6070" to-port="0" /> + <edge from-layer="6069" from-port="0" to-layer="6070" to-port="1" /> + <edge from-layer="6070" from-port="2" to-layer="6125" to-port="1" /> + <edge from-layer="6071" from-port="0" to-layer="6076" to-port="0" /> + <edge from-layer="6072" from-port="0" to-layer="6075" to-port="1" /> + <edge from-layer="6073" from-port="0" to-layer="6075" to-port="2" /> + <edge from-layer="6074" from-port="0" to-layer="6075" to-port="3" /> + <edge from-layer="6075" from-port="4" to-layer="6076" to-port="1" /> + <edge from-layer="6076" from-port="2" to-layer="6077" to-port="0" /> + <edge from-layer="6077" from-port="1" to-layer="6079" to-port="0" /> + <edge from-layer="6078" from-port="0" to-layer="6079" to-port="2" /> + <edge from-layer="6079" from-port="3" to-layer="6098" to-port="0" /> + <edge from-layer="6080" from-port="0" to-layer="6081" to-port="0" /> + <edge from-layer="6081" from-port="1" to-layer="6084" to-port="0" /> + <edge from-layer="6082" from-port="0" to-layer="6083" to-port="0" /> + <edge from-layer="6083" from-port="1" to-layer="6084" to-port="1" /> + <edge from-layer="6084" from-port="2" to-layer="6086" to-port="0" /> + <edge from-layer="6085" from-port="0" to-layer="6086" to-port="1" /> + <edge from-layer="6086" from-port="2" to-layer="6088" to-port="0" /> + <edge from-layer="6087" from-port="0" to-layer="6088" to-port="1" /> + <edge from-layer="6088" from-port="2" to-layer="6089" to-port="0" /> + <edge from-layer="6089" from-port="1" to-layer="6090" to-port="1" /> + <edge from-layer="6090" from-port="2" to-layer="6093" to-port="0" /> + <edge from-layer="6091" from-port="0" to-layer="6092" to-port="0" /> + <edge from-layer="6092" from-port="1" to-layer="6093" to-port="1" /> + <edge from-layer="6093" from-port="2" to-layer="6095" to-port="0" /> + <edge from-layer="6094" from-port="0" to-layer="6095" to-port="1" /> + <edge from-layer="6095" from-port="2" to-layer="6097" to-port="0" /> + <edge from-layer="6096" from-port="0" to-layer="6097" to-port="1" /> + <edge from-layer="6097" from-port="2" to-layer="6098" to-port="1" /> + <edge from-layer="6098" from-port="2" to-layer="6099" to-port="0" /> + <edge from-layer="6098" from-port="2" to-layer="6100" to-port="0" /> + <edge from-layer="6098" from-port="2" to-layer="11189" to-port="0" /> + <edge from-layer="6099" from-port="2" to-layer="6109" to-port="0" /> + <edge from-layer="6100" from-port="1" to-layer="6103" to-port="0" /> + <edge from-layer="6100" from-port="1" to-layer="6107" to-port="0" /> + <edge from-layer="6101" from-port="0" to-layer="6103" to-port="1" /> + <edge from-layer="6102" from-port="0" to-layer="6103" to-port="2" /> + <edge from-layer="6103" from-port="3" to-layer="6108" to-port="1" /> + <edge from-layer="6104" from-port="0" to-layer="6108" to-port="2" /> + <edge from-layer="6105" from-port="0" to-layer="6107" to-port="1" /> + <edge from-layer="6106" from-port="0" to-layer="6107" to-port="2" /> + <edge from-layer="6107" from-port="3" to-layer="6108" to-port="3" /> + <edge from-layer="6108" from-port="4" to-layer="6109" to-port="1" /> + <edge from-layer="6109" from-port="2" to-layer="6111" to-port="0" /> + <edge from-layer="6110" from-port="0" to-layer="6111" to-port="1" /> + <edge from-layer="6111" from-port="2" to-layer="6125" to-port="2" /> + <edge from-layer="6112" from-port="0" to-layer="6124" to-port="1" /> + <edge from-layer="6113" from-port="1" to-layer="6116" to-port="0" /> + <edge from-layer="6114" from-port="0" to-layer="6116" to-port="1" /> + <edge from-layer="6115" from-port="0" to-layer="6116" to-port="2" /> + <edge from-layer="6116" from-port="3" to-layer="6121" to-port="0" /> + <edge from-layer="6117" from-port="1" to-layer="6120" to-port="0" /> + <edge from-layer="6118" from-port="0" to-layer="6120" to-port="1" /> + <edge from-layer="6119" from-port="0" to-layer="6120" to-port="2" /> + <edge from-layer="6120" from-port="3" to-layer="6121" to-port="1" /> + <edge from-layer="6121" from-port="2" to-layer="6124" to-port="2" /> + <edge from-layer="6122" from-port="0" to-layer="6124" to-port="3" /> + <edge from-layer="6123" from-port="0" to-layer="6124" to-port="4" /> + <edge from-layer="6124" from-port="5" to-layer="6125" to-port="3" /> + <edge from-layer="6125" from-port="4" to-layer="6127" to-port="0" /> + <edge from-layer="6126" from-port="0" to-layer="6127" to-port="1" /> + <edge from-layer="6127" from-port="2" to-layer="6129" to-port="0" /> + <edge from-layer="6128" from-port="0" to-layer="6129" to-port="1" /> + <edge from-layer="6129" from-port="2" to-layer="6140" to-port="0" /> + <edge from-layer="6130" from-port="0" to-layer="6131" to-port="0" /> + <edge from-layer="6131" from-port="1" to-layer="6134" to-port="0" /> + <edge from-layer="6132" from-port="0" to-layer="6133" to-port="0" /> + <edge from-layer="6133" from-port="1" to-layer="6134" to-port="1" /> + <edge from-layer="6134" from-port="2" to-layer="6136" to-port="0" /> + <edge from-layer="6135" from-port="0" to-layer="6136" to-port="1" /> + <edge from-layer="6136" from-port="2" to-layer="6138" to-port="0" /> + <edge from-layer="6137" from-port="0" to-layer="6138" to-port="1" /> + <edge from-layer="6138" from-port="2" to-layer="6139" to-port="0" /> + <edge from-layer="6139" from-port="1" to-layer="6140" to-port="1" /> + <edge from-layer="6140" from-port="2" to-layer="6141" to-port="1" /> + <edge from-layer="6141" from-port="2" to-layer="6189" to-port="0" /> + <edge from-layer="6141" from-port="2" to-layer="6152" to-port="0" /> + <edge from-layer="6141" from-port="2" to-layer="6145" to-port="0" /> + <edge from-layer="6142" from-port="0" to-layer="6153" to-port="0" /> + <edge from-layer="6143" from-port="0" to-layer="6151" to-port="0" /> + <edge from-layer="6144" from-port="0" to-layer="6145" to-port="1" /> + <edge from-layer="6145" from-port="2" to-layer="6147" to-port="0" /> + <edge from-layer="6146" from-port="0" to-layer="6147" to-port="1" /> + <edge from-layer="6147" from-port="2" to-layer="6149" to-port="0" /> + <edge from-layer="6148" from-port="0" to-layer="6149" to-port="1" /> + <edge from-layer="6149" from-port="2" to-layer="6150" to-port="0" /> + <edge from-layer="6150" from-port="1" to-layer="6151" to-port="1" /> + <edge from-layer="6151" from-port="2" to-layer="6152" to-port="1" /> + <edge from-layer="6152" from-port="2" to-layer="6153" to-port="1" /> + <edge from-layer="6153" from-port="2" to-layer="6176" to-port="0" /> + <edge from-layer="6153" from-port="2" to-layer="6164" to-port="0" /> + <edge from-layer="6154" from-port="0" to-layer="6155" to-port="0" /> + <edge from-layer="6155" from-port="1" to-layer="6158" to-port="0" /> + <edge from-layer="6156" from-port="0" to-layer="6157" to-port="0" /> + <edge from-layer="6157" from-port="1" to-layer="6158" to-port="1" /> + <edge from-layer="6158" from-port="2" to-layer="6160" to-port="0" /> + <edge from-layer="6159" from-port="0" to-layer="6160" to-port="1" /> + <edge from-layer="6160" from-port="2" to-layer="6162" to-port="0" /> + <edge from-layer="6161" from-port="0" to-layer="6162" to-port="1" /> + <edge from-layer="6162" from-port="2" to-layer="6163" to-port="0" /> + <edge from-layer="6163" from-port="1" to-layer="6164" to-port="1" /> + <edge from-layer="6164" from-port="2" to-layer="6165" to-port="0" /> + <edge from-layer="6165" from-port="1" to-layer="6177" to-port="0" /> + <edge from-layer="6166" from-port="0" to-layer="6167" to-port="0" /> + <edge from-layer="6167" from-port="1" to-layer="6170" to-port="0" /> + <edge from-layer="6168" from-port="0" to-layer="6169" to-port="0" /> + <edge from-layer="6169" from-port="1" to-layer="6170" to-port="1" /> + <edge from-layer="6170" from-port="2" to-layer="6172" to-port="0" /> + <edge from-layer="6171" from-port="0" to-layer="6172" to-port="1" /> + <edge from-layer="6172" from-port="2" to-layer="6174" to-port="0" /> + <edge from-layer="6173" from-port="0" to-layer="6174" to-port="1" /> + <edge from-layer="6174" from-port="2" to-layer="6175" to-port="0" /> + <edge from-layer="6175" from-port="1" to-layer="6176" to-port="1" /> + <edge from-layer="6176" from-port="2" to-layer="6177" to-port="1" /> + <edge from-layer="6177" from-port="2" to-layer="6188" to-port="0" /> + <edge from-layer="6178" from-port="0" to-layer="6179" to-port="0" /> + <edge from-layer="6179" from-port="1" to-layer="6182" to-port="0" /> + <edge from-layer="6180" from-port="0" to-layer="6181" to-port="0" /> + <edge from-layer="6181" from-port="1" to-layer="6182" to-port="1" /> + <edge from-layer="6182" from-port="2" to-layer="6184" to-port="0" /> + <edge from-layer="6183" from-port="0" to-layer="6184" to-port="1" /> + <edge from-layer="6184" from-port="2" to-layer="6186" to-port="0" /> + <edge from-layer="6185" from-port="0" to-layer="6186" to-port="1" /> + <edge from-layer="6186" from-port="2" to-layer="6187" to-port="0" /> + <edge from-layer="6187" from-port="1" to-layer="6188" to-port="1" /> + <edge from-layer="6188" from-port="2" to-layer="6189" to-port="1" /> + <edge from-layer="6189" from-port="2" to-layer="6373" to-port="0" /> + <edge from-layer="6189" from-port="2" to-layer="6200" to-port="0" /> + <edge from-layer="6189" from-port="2" to-layer="6193" to-port="0" /> + <edge from-layer="6190" from-port="0" to-layer="6201" to-port="0" /> + <edge from-layer="6191" from-port="0" to-layer="6199" to-port="0" /> + <edge from-layer="6192" from-port="0" to-layer="6193" to-port="1" /> + <edge from-layer="6193" from-port="2" to-layer="6195" to-port="0" /> + <edge from-layer="6194" from-port="0" to-layer="6195" to-port="1" /> + <edge from-layer="6195" from-port="2" to-layer="6197" to-port="0" /> + <edge from-layer="6196" from-port="0" to-layer="6197" to-port="1" /> + <edge from-layer="6197" from-port="2" to-layer="6198" to-port="0" /> + <edge from-layer="6198" from-port="1" to-layer="6199" to-port="1" /> + <edge from-layer="6199" from-port="2" to-layer="6200" to-port="1" /> + <edge from-layer="6200" from-port="2" to-layer="6201" to-port="1" /> + <edge from-layer="6201" from-port="2" to-layer="6322" to-port="0" /> + <edge from-layer="6201" from-port="2" to-layer="6260" to-port="0" /> + <edge from-layer="6201" from-port="2" to-layer="6212" to-port="0" /> + <edge from-layer="6202" from-port="0" to-layer="6203" to-port="0" /> + <edge from-layer="6203" from-port="1" to-layer="6206" to-port="0" /> + <edge from-layer="6204" from-port="0" to-layer="6205" to-port="0" /> + <edge from-layer="6205" from-port="1" to-layer="6206" to-port="1" /> + <edge from-layer="6206" from-port="2" to-layer="6208" to-port="0" /> + <edge from-layer="6207" from-port="0" to-layer="6208" to-port="1" /> + <edge from-layer="6208" from-port="2" to-layer="6210" to-port="0" /> + <edge from-layer="6209" from-port="0" to-layer="6210" to-port="1" /> + <edge from-layer="6210" from-port="2" to-layer="6211" to-port="0" /> + <edge from-layer="6211" from-port="1" to-layer="6212" to-port="1" /> + <edge from-layer="6212" from-port="2" to-layer="6215" to-port="0" /> + <edge from-layer="6213" from-port="0" to-layer="6214" to-port="0" /> + <edge from-layer="6214" from-port="1" to-layer="6215" to-port="1" /> + <edge from-layer="6215" from-port="2" to-layer="6217" to-port="0" /> + <edge from-layer="6216" from-port="0" to-layer="6217" to-port="1" /> + <edge from-layer="6217" from-port="2" to-layer="6219" to-port="0" /> + <edge from-layer="6218" from-port="0" to-layer="6219" to-port="1" /> + <edge from-layer="6219" from-port="2" to-layer="6237" to-port="0" /> + <edge from-layer="6219" from-port="2" to-layer="6231" to-port="0" /> + <edge from-layer="6219" from-port="2" to-layer="6221" to-port="0" /> + <edge from-layer="6219" from-port="2" to-layer="6220" to-port="0" /> + <edge from-layer="6220" from-port="2" to-layer="6240" to-port="0" /> + <edge from-layer="6221" from-port="1" to-layer="6223" to-port="0" /> + <edge from-layer="6222" from-port="0" to-layer="6223" to-port="2" /> + <edge from-layer="6223" from-port="3" to-layer="6224" to-port="0" /> + <edge from-layer="6224" from-port="2" to-layer="6225" to-port="0" /> + <edge from-layer="6225" from-port="1" to-layer="6227" to-port="0" /> + <edge from-layer="6226" from-port="0" to-layer="6227" to-port="1" /> + <edge from-layer="6227" from-port="2" to-layer="6231" to-port="1" /> + <edge from-layer="6227" from-port="2" to-layer="6237" to-port="2" /> + <edge from-layer="6228" from-port="0" to-layer="6231" to-port="2" /> + <edge from-layer="6229" from-port="0" to-layer="6231" to-port="3" /> + <edge from-layer="6230" from-port="0" to-layer="6231" to-port="4" /> + <edge from-layer="6231" from-port="5" to-layer="6233" to-port="0" /> + <edge from-layer="6232" from-port="0" to-layer="6233" to-port="1" /> + <edge from-layer="6233" from-port="2" to-layer="6238" to-port="0" /> + <edge from-layer="6234" from-port="0" to-layer="6237" to-port="1" /> + <edge from-layer="6235" from-port="0" to-layer="6237" to-port="3" /> + <edge from-layer="6236" from-port="0" to-layer="6237" to-port="4" /> + <edge from-layer="6237" from-port="5" to-layer="6238" to-port="1" /> + <edge from-layer="6238" from-port="2" to-layer="6239" to-port="0" /> + <edge from-layer="6239" from-port="2" to-layer="6240" to-port="1" /> + <edge from-layer="6240" from-port="2" to-layer="6357" to-port="0" /> + <edge from-layer="6241" from-port="0" to-layer="6246" to-port="0" /> + <edge from-layer="6242" from-port="0" to-layer="6245" to-port="1" /> + <edge from-layer="6243" from-port="0" to-layer="6245" to-port="2" /> + <edge from-layer="6244" from-port="0" to-layer="6245" to-port="3" /> + <edge from-layer="6245" from-port="4" to-layer="6246" to-port="1" /> + <edge from-layer="6246" from-port="2" to-layer="6247" to-port="0" /> + <edge from-layer="6247" from-port="1" to-layer="6249" to-port="0" /> + <edge from-layer="6248" from-port="0" to-layer="6249" to-port="2" /> + <edge from-layer="6249" from-port="3" to-layer="6345" to-port="0" /> + <edge from-layer="6249" from-port="3" to-layer="6289" to-port="0" /> + <edge from-layer="6250" from-port="0" to-layer="6251" to-port="0" /> + <edge from-layer="6251" from-port="1" to-layer="6254" to-port="0" /> + <edge from-layer="6252" from-port="0" to-layer="6253" to-port="0" /> + <edge from-layer="6253" from-port="1" to-layer="6254" to-port="1" /> + <edge from-layer="6254" from-port="2" to-layer="6256" to-port="0" /> + <edge from-layer="6255" from-port="0" to-layer="6256" to-port="1" /> + <edge from-layer="6256" from-port="2" to-layer="6258" to-port="0" /> + <edge from-layer="6257" from-port="0" to-layer="6258" to-port="1" /> + <edge from-layer="6258" from-port="2" to-layer="6259" to-port="0" /> + <edge from-layer="6259" from-port="1" to-layer="6260" to-port="1" /> + <edge from-layer="6260" from-port="2" to-layer="6263" to-port="0" /> + <edge from-layer="6261" from-port="0" to-layer="6262" to-port="0" /> + <edge from-layer="6262" from-port="1" to-layer="6263" to-port="1" /> + <edge from-layer="6263" from-port="2" to-layer="6265" to-port="0" /> + <edge from-layer="6264" from-port="0" to-layer="6265" to-port="1" /> + <edge from-layer="6265" from-port="2" to-layer="6267" to-port="0" /> + <edge from-layer="6266" from-port="0" to-layer="6267" to-port="1" /> + <edge from-layer="6267" from-port="2" to-layer="6268" to-port="0" /> + <edge from-layer="6267" from-port="2" to-layer="6269" to-port="0" /> + <edge from-layer="6267" from-port="2" to-layer="6285" to-port="0" /> + <edge from-layer="6267" from-port="2" to-layer="6279" to-port="0" /> + <edge from-layer="6268" from-port="2" to-layer="6288" to-port="0" /> + <edge from-layer="6269" from-port="1" to-layer="6271" to-port="0" /> + <edge from-layer="6270" from-port="0" to-layer="6271" to-port="2" /> + <edge from-layer="6271" from-port="3" to-layer="6272" to-port="0" /> + <edge from-layer="6272" from-port="2" to-layer="6273" to-port="0" /> + <edge from-layer="6273" from-port="1" to-layer="6275" to-port="0" /> + <edge from-layer="6274" from-port="0" to-layer="6275" to-port="1" /> + <edge from-layer="6275" from-port="2" to-layer="6279" to-port="1" /> + <edge from-layer="6275" from-port="2" to-layer="6285" to-port="2" /> + <edge from-layer="6276" from-port="0" to-layer="6279" to-port="2" /> + <edge from-layer="6277" from-port="0" to-layer="6279" to-port="3" /> + <edge from-layer="6278" from-port="0" to-layer="6279" to-port="4" /> + <edge from-layer="6279" from-port="5" to-layer="6281" to-port="0" /> + <edge from-layer="6280" from-port="0" to-layer="6281" to-port="1" /> + <edge from-layer="6281" from-port="2" to-layer="6286" to-port="0" /> + <edge from-layer="6282" from-port="0" to-layer="6285" to-port="1" /> + <edge from-layer="6283" from-port="0" to-layer="6285" to-port="3" /> + <edge from-layer="6284" from-port="0" to-layer="6285" to-port="4" /> + <edge from-layer="6285" from-port="5" to-layer="6286" to-port="1" /> + <edge from-layer="6286" from-port="2" to-layer="6287" to-port="0" /> + <edge from-layer="6287" from-port="2" to-layer="6288" to-port="1" /> + <edge from-layer="6288" from-port="2" to-layer="6289" to-port="1" /> + <edge from-layer="6288" from-port="2" to-layer="6349" to-port="0" /> + <edge from-layer="6289" from-port="2" to-layer="6290" to-port="0" /> + <edge from-layer="6289" from-port="2" to-layer="6291" to-port="0" /> + <edge from-layer="6289" from-port="2" to-layer="11188" to-port="0" /> + <edge from-layer="6290" from-port="2" to-layer="6300" to-port="0" /> + <edge from-layer="6291" from-port="1" to-layer="6294" to-port="0" /> + <edge from-layer="6291" from-port="1" to-layer="6298" to-port="0" /> + <edge from-layer="6292" from-port="0" to-layer="6294" to-port="1" /> + <edge from-layer="6293" from-port="0" to-layer="6294" to-port="2" /> + <edge from-layer="6294" from-port="3" to-layer="6299" to-port="0" /> + <edge from-layer="6295" from-port="0" to-layer="6299" to-port="1" /> + <edge from-layer="6296" from-port="0" to-layer="6298" to-port="1" /> + <edge from-layer="6297" from-port="0" to-layer="6298" to-port="2" /> + <edge from-layer="6298" from-port="3" to-layer="6299" to-port="2" /> + <edge from-layer="6299" from-port="3" to-layer="6300" to-port="1" /> + <edge from-layer="6300" from-port="2" to-layer="6302" to-port="0" /> + <edge from-layer="6301" from-port="0" to-layer="6302" to-port="1" /> + <edge from-layer="6302" from-port="2" to-layer="6357" to-port="1" /> + <edge from-layer="6303" from-port="0" to-layer="6308" to-port="0" /> + <edge from-layer="6304" from-port="0" to-layer="6307" to-port="1" /> + <edge from-layer="6305" from-port="0" to-layer="6307" to-port="2" /> + <edge from-layer="6306" from-port="0" to-layer="6307" to-port="3" /> + <edge from-layer="6307" from-port="4" to-layer="6308" to-port="1" /> + <edge from-layer="6308" from-port="2" to-layer="6309" to-port="0" /> + <edge from-layer="6309" from-port="1" to-layer="6311" to-port="0" /> + <edge from-layer="6310" from-port="0" to-layer="6311" to-port="2" /> + <edge from-layer="6311" from-port="3" to-layer="6330" to-port="0" /> + <edge from-layer="6312" from-port="0" to-layer="6313" to-port="0" /> + <edge from-layer="6313" from-port="1" to-layer="6316" to-port="0" /> + <edge from-layer="6314" from-port="0" to-layer="6315" to-port="0" /> + <edge from-layer="6315" from-port="1" to-layer="6316" to-port="1" /> + <edge from-layer="6316" from-port="2" to-layer="6318" to-port="0" /> + <edge from-layer="6317" from-port="0" to-layer="6318" to-port="1" /> + <edge from-layer="6318" from-port="2" to-layer="6320" to-port="0" /> + <edge from-layer="6319" from-port="0" to-layer="6320" to-port="1" /> + <edge from-layer="6320" from-port="2" to-layer="6321" to-port="0" /> + <edge from-layer="6321" from-port="1" to-layer="6322" to-port="1" /> + <edge from-layer="6322" from-port="2" to-layer="6325" to-port="0" /> + <edge from-layer="6323" from-port="0" to-layer="6324" to-port="0" /> + <edge from-layer="6324" from-port="1" to-layer="6325" to-port="1" /> + <edge from-layer="6325" from-port="2" to-layer="6327" to-port="0" /> + <edge from-layer="6326" from-port="0" to-layer="6327" to-port="1" /> + <edge from-layer="6327" from-port="2" to-layer="6329" to-port="0" /> + <edge from-layer="6328" from-port="0" to-layer="6329" to-port="1" /> + <edge from-layer="6329" from-port="2" to-layer="6330" to-port="1" /> + <edge from-layer="6330" from-port="2" to-layer="11187" to-port="0" /> + <edge from-layer="6330" from-port="2" to-layer="6331" to-port="0" /> + <edge from-layer="6330" from-port="2" to-layer="6332" to-port="0" /> + <edge from-layer="6331" from-port="2" to-layer="6341" to-port="0" /> + <edge from-layer="6332" from-port="1" to-layer="6339" to-port="0" /> + <edge from-layer="6332" from-port="1" to-layer="6335" to-port="0" /> + <edge from-layer="6333" from-port="0" to-layer="6335" to-port="1" /> + <edge from-layer="6334" from-port="0" to-layer="6335" to-port="2" /> + <edge from-layer="6335" from-port="3" to-layer="6340" to-port="1" /> + <edge from-layer="6336" from-port="0" to-layer="6340" to-port="2" /> + <edge from-layer="6337" from-port="0" to-layer="6339" to-port="1" /> + <edge from-layer="6338" from-port="0" to-layer="6339" to-port="2" /> + <edge from-layer="6339" from-port="3" to-layer="6340" to-port="3" /> + <edge from-layer="6340" from-port="4" to-layer="6341" to-port="1" /> + <edge from-layer="6341" from-port="2" to-layer="6343" to-port="0" /> + <edge from-layer="6342" from-port="0" to-layer="6343" to-port="1" /> + <edge from-layer="6343" from-port="2" to-layer="6357" to-port="2" /> + <edge from-layer="6344" from-port="0" to-layer="6356" to-port="1" /> + <edge from-layer="6345" from-port="1" to-layer="6348" to-port="0" /> + <edge from-layer="6346" from-port="0" to-layer="6348" to-port="1" /> + <edge from-layer="6347" from-port="0" to-layer="6348" to-port="2" /> + <edge from-layer="6348" from-port="3" to-layer="6353" to-port="0" /> + <edge from-layer="6349" from-port="1" to-layer="6352" to-port="0" /> + <edge from-layer="6350" from-port="0" to-layer="6352" to-port="1" /> + <edge from-layer="6351" from-port="0" to-layer="6352" to-port="2" /> + <edge from-layer="6352" from-port="3" to-layer="6353" to-port="1" /> + <edge from-layer="6353" from-port="2" to-layer="6356" to-port="2" /> + <edge from-layer="6354" from-port="0" to-layer="6356" to-port="3" /> + <edge from-layer="6355" from-port="0" to-layer="6356" to-port="4" /> + <edge from-layer="6356" from-port="5" to-layer="6357" to-port="3" /> + <edge from-layer="6357" from-port="4" to-layer="6359" to-port="0" /> + <edge from-layer="6358" from-port="0" to-layer="6359" to-port="1" /> + <edge from-layer="6359" from-port="2" to-layer="6361" to-port="0" /> + <edge from-layer="6360" from-port="0" to-layer="6361" to-port="1" /> + <edge from-layer="6361" from-port="2" to-layer="6372" to-port="0" /> + <edge from-layer="6362" from-port="0" to-layer="6363" to-port="0" /> + <edge from-layer="6363" from-port="1" to-layer="6366" to-port="0" /> + <edge from-layer="6364" from-port="0" to-layer="6365" to-port="0" /> + <edge from-layer="6365" from-port="1" to-layer="6366" to-port="1" /> + <edge from-layer="6366" from-port="2" to-layer="6368" to-port="0" /> + <edge from-layer="6367" from-port="0" to-layer="6368" to-port="1" /> + <edge from-layer="6368" from-port="2" to-layer="6370" to-port="0" /> + <edge from-layer="6369" from-port="0" to-layer="6370" to-port="1" /> + <edge from-layer="6370" from-port="2" to-layer="6371" to-port="0" /> + <edge from-layer="6371" from-port="1" to-layer="6372" to-port="1" /> + <edge from-layer="6372" from-port="2" to-layer="6373" to-port="1" /> + <edge from-layer="6373" from-port="2" to-layer="6384" to-port="0" /> + <edge from-layer="6373" from-port="2" to-layer="6421" to-port="0" /> + <edge from-layer="6373" from-port="2" to-layer="6377" to-port="0" /> + <edge from-layer="6374" from-port="0" to-layer="6385" to-port="0" /> + <edge from-layer="6375" from-port="0" to-layer="6383" to-port="0" /> + <edge from-layer="6376" from-port="0" to-layer="6377" to-port="1" /> + <edge from-layer="6377" from-port="2" to-layer="6379" to-port="0" /> + <edge from-layer="6378" from-port="0" to-layer="6379" to-port="1" /> + <edge from-layer="6379" from-port="2" to-layer="6381" to-port="0" /> + <edge from-layer="6380" from-port="0" to-layer="6381" to-port="1" /> + <edge from-layer="6381" from-port="2" to-layer="6382" to-port="0" /> + <edge from-layer="6382" from-port="1" to-layer="6383" to-port="1" /> + <edge from-layer="6383" from-port="2" to-layer="6384" to-port="1" /> + <edge from-layer="6384" from-port="2" to-layer="6385" to-port="1" /> + <edge from-layer="6385" from-port="2" to-layer="6396" to-port="0" /> + <edge from-layer="6385" from-port="2" to-layer="6408" to-port="0" /> + <edge from-layer="6386" from-port="0" to-layer="6387" to-port="0" /> + <edge from-layer="6387" from-port="1" to-layer="6390" to-port="0" /> + <edge from-layer="6388" from-port="0" to-layer="6389" to-port="0" /> + <edge from-layer="6389" from-port="1" to-layer="6390" to-port="1" /> + <edge from-layer="6390" from-port="2" to-layer="6392" to-port="0" /> + <edge from-layer="6391" from-port="0" to-layer="6392" to-port="1" /> + <edge from-layer="6392" from-port="2" to-layer="6394" to-port="0" /> + <edge from-layer="6393" from-port="0" to-layer="6394" to-port="1" /> + <edge from-layer="6394" from-port="2" to-layer="6395" to-port="0" /> + <edge from-layer="6395" from-port="1" to-layer="6396" to-port="1" /> + <edge from-layer="6396" from-port="2" to-layer="6397" to-port="0" /> + <edge from-layer="6397" from-port="1" to-layer="6409" to-port="0" /> + <edge from-layer="6398" from-port="0" to-layer="6399" to-port="0" /> + <edge from-layer="6399" from-port="1" to-layer="6402" to-port="0" /> + <edge from-layer="6400" from-port="0" to-layer="6401" to-port="0" /> + <edge from-layer="6401" from-port="1" to-layer="6402" to-port="1" /> + <edge from-layer="6402" from-port="2" to-layer="6404" to-port="0" /> + <edge from-layer="6403" from-port="0" to-layer="6404" to-port="1" /> + <edge from-layer="6404" from-port="2" to-layer="6406" to-port="0" /> + <edge from-layer="6405" from-port="0" to-layer="6406" to-port="1" /> + <edge from-layer="6406" from-port="2" to-layer="6407" to-port="0" /> + <edge from-layer="6407" from-port="1" to-layer="6408" to-port="1" /> + <edge from-layer="6408" from-port="2" to-layer="6409" to-port="1" /> + <edge from-layer="6409" from-port="2" to-layer="6420" to-port="0" /> + <edge from-layer="6410" from-port="0" to-layer="6411" to-port="0" /> + <edge from-layer="6411" from-port="1" to-layer="6414" to-port="0" /> + <edge from-layer="6412" from-port="0" to-layer="6413" to-port="0" /> + <edge from-layer="6413" from-port="1" to-layer="6414" to-port="1" /> + <edge from-layer="6414" from-port="2" to-layer="6416" to-port="0" /> + <edge from-layer="6415" from-port="0" to-layer="6416" to-port="1" /> + <edge from-layer="6416" from-port="2" to-layer="6418" to-port="0" /> + <edge from-layer="6417" from-port="0" to-layer="6418" to-port="1" /> + <edge from-layer="6418" from-port="2" to-layer="6419" to-port="0" /> + <edge from-layer="6419" from-port="1" to-layer="6420" to-port="1" /> + <edge from-layer="6420" from-port="2" to-layer="6421" to-port="1" /> + <edge from-layer="6421" from-port="2" to-layer="6432" to-port="0" /> + <edge from-layer="6421" from-port="2" to-layer="6425" to-port="0" /> + <edge from-layer="6421" from-port="2" to-layer="6605" to-port="0" /> + <edge from-layer="6422" from-port="0" to-layer="6433" to-port="0" /> + <edge from-layer="6423" from-port="0" to-layer="6431" to-port="0" /> + <edge from-layer="6424" from-port="0" to-layer="6425" to-port="1" /> + <edge from-layer="6425" from-port="2" to-layer="6427" to-port="0" /> + <edge from-layer="6426" from-port="0" to-layer="6427" to-port="1" /> + <edge from-layer="6427" from-port="2" to-layer="6429" to-port="0" /> + <edge from-layer="6428" from-port="0" to-layer="6429" to-port="1" /> + <edge from-layer="6429" from-port="2" to-layer="6430" to-port="0" /> + <edge from-layer="6430" from-port="1" to-layer="6431" to-port="1" /> + <edge from-layer="6431" from-port="2" to-layer="6432" to-port="1" /> + <edge from-layer="6432" from-port="2" to-layer="6433" to-port="1" /> + <edge from-layer="6433" from-port="2" to-layer="6554" to-port="0" /> + <edge from-layer="6433" from-port="2" to-layer="6492" to-port="0" /> + <edge from-layer="6433" from-port="2" to-layer="6444" to-port="0" /> + <edge from-layer="6434" from-port="0" to-layer="6435" to-port="0" /> + <edge from-layer="6435" from-port="1" to-layer="6438" to-port="0" /> + <edge from-layer="6436" from-port="0" to-layer="6437" to-port="0" /> + <edge from-layer="6437" from-port="1" to-layer="6438" to-port="1" /> + <edge from-layer="6438" from-port="2" to-layer="6440" to-port="0" /> + <edge from-layer="6439" from-port="0" to-layer="6440" to-port="1" /> + <edge from-layer="6440" from-port="2" to-layer="6442" to-port="0" /> + <edge from-layer="6441" from-port="0" to-layer="6442" to-port="1" /> + <edge from-layer="6442" from-port="2" to-layer="6443" to-port="0" /> + <edge from-layer="6443" from-port="1" to-layer="6444" to-port="1" /> + <edge from-layer="6444" from-port="2" to-layer="6447" to-port="0" /> + <edge from-layer="6445" from-port="0" to-layer="6446" to-port="0" /> + <edge from-layer="6446" from-port="1" to-layer="6447" to-port="1" /> + <edge from-layer="6447" from-port="2" to-layer="6449" to-port="0" /> + <edge from-layer="6448" from-port="0" to-layer="6449" to-port="1" /> + <edge from-layer="6449" from-port="2" to-layer="6451" to-port="0" /> + <edge from-layer="6450" from-port="0" to-layer="6451" to-port="1" /> + <edge from-layer="6451" from-port="2" to-layer="6463" to-port="0" /> + <edge from-layer="6451" from-port="2" to-layer="6469" to-port="0" /> + <edge from-layer="6451" from-port="2" to-layer="6453" to-port="0" /> + <edge from-layer="6451" from-port="2" to-layer="6452" to-port="0" /> + <edge from-layer="6452" from-port="2" to-layer="6472" to-port="0" /> + <edge from-layer="6453" from-port="1" to-layer="6455" to-port="0" /> + <edge from-layer="6454" from-port="0" to-layer="6455" to-port="2" /> + <edge from-layer="6455" from-port="3" to-layer="6456" to-port="0" /> + <edge from-layer="6456" from-port="2" to-layer="6457" to-port="0" /> + <edge from-layer="6457" from-port="1" to-layer="6459" to-port="0" /> + <edge from-layer="6458" from-port="0" to-layer="6459" to-port="1" /> + <edge from-layer="6459" from-port="2" to-layer="6463" to-port="1" /> + <edge from-layer="6459" from-port="2" to-layer="6469" to-port="2" /> + <edge from-layer="6460" from-port="0" to-layer="6463" to-port="2" /> + <edge from-layer="6461" from-port="0" to-layer="6463" to-port="3" /> + <edge from-layer="6462" from-port="0" to-layer="6463" to-port="4" /> + <edge from-layer="6463" from-port="5" to-layer="6465" to-port="0" /> + <edge from-layer="6464" from-port="0" to-layer="6465" to-port="1" /> + <edge from-layer="6465" from-port="2" to-layer="6470" to-port="0" /> + <edge from-layer="6466" from-port="0" to-layer="6469" to-port="1" /> + <edge from-layer="6467" from-port="0" to-layer="6469" to-port="3" /> + <edge from-layer="6468" from-port="0" to-layer="6469" to-port="4" /> + <edge from-layer="6469" from-port="5" to-layer="6470" to-port="1" /> + <edge from-layer="6470" from-port="2" to-layer="6471" to-port="0" /> + <edge from-layer="6471" from-port="2" to-layer="6472" to-port="1" /> + <edge from-layer="6472" from-port="2" to-layer="6589" to-port="0" /> + <edge from-layer="6473" from-port="0" to-layer="6478" to-port="0" /> + <edge from-layer="6474" from-port="0" to-layer="6477" to-port="1" /> + <edge from-layer="6475" from-port="0" to-layer="6477" to-port="2" /> + <edge from-layer="6476" from-port="0" to-layer="6477" to-port="3" /> + <edge from-layer="6477" from-port="4" to-layer="6478" to-port="1" /> + <edge from-layer="6478" from-port="2" to-layer="6479" to-port="0" /> + <edge from-layer="6479" from-port="1" to-layer="6481" to-port="0" /> + <edge from-layer="6480" from-port="0" to-layer="6481" to-port="2" /> + <edge from-layer="6481" from-port="3" to-layer="6521" to-port="0" /> + <edge from-layer="6481" from-port="3" to-layer="6577" to-port="0" /> + <edge from-layer="6482" from-port="0" to-layer="6483" to-port="0" /> + <edge from-layer="6483" from-port="1" to-layer="6486" to-port="0" /> + <edge from-layer="6484" from-port="0" to-layer="6485" to-port="0" /> + <edge from-layer="6485" from-port="1" to-layer="6486" to-port="1" /> + <edge from-layer="6486" from-port="2" to-layer="6488" to-port="0" /> + <edge from-layer="6487" from-port="0" to-layer="6488" to-port="1" /> + <edge from-layer="6488" from-port="2" to-layer="6490" to-port="0" /> + <edge from-layer="6489" from-port="0" to-layer="6490" to-port="1" /> + <edge from-layer="6490" from-port="2" to-layer="6491" to-port="0" /> + <edge from-layer="6491" from-port="1" to-layer="6492" to-port="1" /> + <edge from-layer="6492" from-port="2" to-layer="6495" to-port="0" /> + <edge from-layer="6493" from-port="0" to-layer="6494" to-port="0" /> + <edge from-layer="6494" from-port="1" to-layer="6495" to-port="1" /> + <edge from-layer="6495" from-port="2" to-layer="6497" to-port="0" /> + <edge from-layer="6496" from-port="0" to-layer="6497" to-port="1" /> + <edge from-layer="6497" from-port="2" to-layer="6499" to-port="0" /> + <edge from-layer="6498" from-port="0" to-layer="6499" to-port="1" /> + <edge from-layer="6499" from-port="2" to-layer="6517" to-port="0" /> + <edge from-layer="6499" from-port="2" to-layer="6511" to-port="0" /> + <edge from-layer="6499" from-port="2" to-layer="6500" to-port="0" /> + <edge from-layer="6499" from-port="2" to-layer="6501" to-port="0" /> + <edge from-layer="6500" from-port="2" to-layer="6520" to-port="0" /> + <edge from-layer="6501" from-port="1" to-layer="6503" to-port="0" /> + <edge from-layer="6502" from-port="0" to-layer="6503" to-port="2" /> + <edge from-layer="6503" from-port="3" to-layer="6504" to-port="0" /> + <edge from-layer="6504" from-port="2" to-layer="6505" to-port="0" /> + <edge from-layer="6505" from-port="1" to-layer="6507" to-port="0" /> + <edge from-layer="6506" from-port="0" to-layer="6507" to-port="1" /> + <edge from-layer="6507" from-port="2" to-layer="6511" to-port="1" /> + <edge from-layer="6507" from-port="2" to-layer="6517" to-port="2" /> + <edge from-layer="6508" from-port="0" to-layer="6511" to-port="2" /> + <edge from-layer="6509" from-port="0" to-layer="6511" to-port="3" /> + <edge from-layer="6510" from-port="0" to-layer="6511" to-port="4" /> + <edge from-layer="6511" from-port="5" to-layer="6513" to-port="0" /> + <edge from-layer="6512" from-port="0" to-layer="6513" to-port="1" /> + <edge from-layer="6513" from-port="2" to-layer="6518" to-port="0" /> + <edge from-layer="6514" from-port="0" to-layer="6517" to-port="1" /> + <edge from-layer="6515" from-port="0" to-layer="6517" to-port="3" /> + <edge from-layer="6516" from-port="0" to-layer="6517" to-port="4" /> + <edge from-layer="6517" from-port="5" to-layer="6518" to-port="1" /> + <edge from-layer="6518" from-port="2" to-layer="6519" to-port="0" /> + <edge from-layer="6519" from-port="2" to-layer="6520" to-port="1" /> + <edge from-layer="6520" from-port="2" to-layer="6521" to-port="1" /> + <edge from-layer="6520" from-port="2" to-layer="6581" to-port="0" /> + <edge from-layer="6521" from-port="2" to-layer="6523" to-port="0" /> + <edge from-layer="6521" from-port="2" to-layer="11186" to-port="0" /> + <edge from-layer="6521" from-port="2" to-layer="6522" to-port="0" /> + <edge from-layer="6522" from-port="2" to-layer="6532" to-port="0" /> + <edge from-layer="6523" from-port="1" to-layer="6530" to-port="0" /> + <edge from-layer="6523" from-port="1" to-layer="6526" to-port="0" /> + <edge from-layer="6524" from-port="0" to-layer="6526" to-port="1" /> + <edge from-layer="6525" from-port="0" to-layer="6526" to-port="2" /> + <edge from-layer="6526" from-port="3" to-layer="6531" to-port="0" /> + <edge from-layer="6527" from-port="0" to-layer="6531" to-port="1" /> + <edge from-layer="6528" from-port="0" to-layer="6530" to-port="1" /> + <edge from-layer="6529" from-port="0" to-layer="6530" to-port="2" /> + <edge from-layer="6530" from-port="3" to-layer="6531" to-port="2" /> + <edge from-layer="6531" from-port="3" to-layer="6532" to-port="1" /> + <edge from-layer="6532" from-port="2" to-layer="6534" to-port="0" /> + <edge from-layer="6533" from-port="0" to-layer="6534" to-port="1" /> + <edge from-layer="6534" from-port="2" to-layer="6589" to-port="1" /> + <edge from-layer="6535" from-port="0" to-layer="6540" to-port="0" /> + <edge from-layer="6536" from-port="0" to-layer="6539" to-port="1" /> + <edge from-layer="6537" from-port="0" to-layer="6539" to-port="2" /> + <edge from-layer="6538" from-port="0" to-layer="6539" to-port="3" /> + <edge from-layer="6539" from-port="4" to-layer="6540" to-port="1" /> + <edge from-layer="6540" from-port="2" to-layer="6541" to-port="0" /> + <edge from-layer="6541" from-port="1" to-layer="6543" to-port="0" /> + <edge from-layer="6542" from-port="0" to-layer="6543" to-port="2" /> + <edge from-layer="6543" from-port="3" to-layer="6562" to-port="0" /> + <edge from-layer="6544" from-port="0" to-layer="6545" to-port="0" /> + <edge from-layer="6545" from-port="1" to-layer="6548" to-port="0" /> + <edge from-layer="6546" from-port="0" to-layer="6547" to-port="0" /> + <edge from-layer="6547" from-port="1" to-layer="6548" to-port="1" /> + <edge from-layer="6548" from-port="2" to-layer="6550" to-port="0" /> + <edge from-layer="6549" from-port="0" to-layer="6550" to-port="1" /> + <edge from-layer="6550" from-port="2" to-layer="6552" to-port="0" /> + <edge from-layer="6551" from-port="0" to-layer="6552" to-port="1" /> + <edge from-layer="6552" from-port="2" to-layer="6553" to-port="0" /> + <edge from-layer="6553" from-port="1" to-layer="6554" to-port="1" /> + <edge from-layer="6554" from-port="2" to-layer="6557" to-port="0" /> + <edge from-layer="6555" from-port="0" to-layer="6556" to-port="0" /> + <edge from-layer="6556" from-port="1" to-layer="6557" to-port="1" /> + <edge from-layer="6557" from-port="2" to-layer="6559" to-port="0" /> + <edge from-layer="6558" from-port="0" to-layer="6559" to-port="1" /> + <edge from-layer="6559" from-port="2" to-layer="6561" to-port="0" /> + <edge from-layer="6560" from-port="0" to-layer="6561" to-port="1" /> + <edge from-layer="6561" from-port="2" to-layer="6562" to-port="1" /> + <edge from-layer="6562" from-port="2" to-layer="6564" to-port="0" /> + <edge from-layer="6562" from-port="2" to-layer="6563" to-port="0" /> + <edge from-layer="6562" from-port="2" to-layer="11185" to-port="0" /> + <edge from-layer="6563" from-port="2" to-layer="6573" to-port="0" /> + <edge from-layer="6564" from-port="1" to-layer="6567" to-port="0" /> + <edge from-layer="6564" from-port="1" to-layer="6571" to-port="0" /> + <edge from-layer="6565" from-port="0" to-layer="6567" to-port="1" /> + <edge from-layer="6566" from-port="0" to-layer="6567" to-port="2" /> + <edge from-layer="6567" from-port="3" to-layer="6572" to-port="1" /> + <edge from-layer="6568" from-port="0" to-layer="6572" to-port="2" /> + <edge from-layer="6569" from-port="0" to-layer="6571" to-port="1" /> + <edge from-layer="6570" from-port="0" to-layer="6571" to-port="2" /> + <edge from-layer="6571" from-port="3" to-layer="6572" to-port="3" /> + <edge from-layer="6572" from-port="4" to-layer="6573" to-port="1" /> + <edge from-layer="6573" from-port="2" to-layer="6575" to-port="0" /> + <edge from-layer="6574" from-port="0" to-layer="6575" to-port="1" /> + <edge from-layer="6575" from-port="2" to-layer="6589" to-port="2" /> + <edge from-layer="6576" from-port="0" to-layer="6588" to-port="1" /> + <edge from-layer="6577" from-port="1" to-layer="6580" to-port="0" /> + <edge from-layer="6578" from-port="0" to-layer="6580" to-port="1" /> + <edge from-layer="6579" from-port="0" to-layer="6580" to-port="2" /> + <edge from-layer="6580" from-port="3" to-layer="6585" to-port="0" /> + <edge from-layer="6581" from-port="1" to-layer="6584" to-port="0" /> + <edge from-layer="6582" from-port="0" to-layer="6584" to-port="1" /> + <edge from-layer="6583" from-port="0" to-layer="6584" to-port="2" /> + <edge from-layer="6584" from-port="3" to-layer="6585" to-port="1" /> + <edge from-layer="6585" from-port="2" to-layer="6588" to-port="2" /> + <edge from-layer="6586" from-port="0" to-layer="6588" to-port="3" /> + <edge from-layer="6587" from-port="0" to-layer="6588" to-port="4" /> + <edge from-layer="6588" from-port="5" to-layer="6589" to-port="3" /> + <edge from-layer="6589" from-port="4" to-layer="6591" to-port="0" /> + <edge from-layer="6590" from-port="0" to-layer="6591" to-port="1" /> + <edge from-layer="6591" from-port="2" to-layer="6593" to-port="0" /> + <edge from-layer="6592" from-port="0" to-layer="6593" to-port="1" /> + <edge from-layer="6593" from-port="2" to-layer="6604" to-port="0" /> + <edge from-layer="6594" from-port="0" to-layer="6595" to-port="0" /> + <edge from-layer="6595" from-port="1" to-layer="6598" to-port="0" /> + <edge from-layer="6596" from-port="0" to-layer="6597" to-port="0" /> + <edge from-layer="6597" from-port="1" to-layer="6598" to-port="1" /> + <edge from-layer="6598" from-port="2" to-layer="6600" to-port="0" /> + <edge from-layer="6599" from-port="0" to-layer="6600" to-port="1" /> + <edge from-layer="6600" from-port="2" to-layer="6602" to-port="0" /> + <edge from-layer="6601" from-port="0" to-layer="6602" to-port="1" /> + <edge from-layer="6602" from-port="2" to-layer="6603" to-port="0" /> + <edge from-layer="6603" from-port="1" to-layer="6604" to-port="1" /> + <edge from-layer="6604" from-port="2" to-layer="6605" to-port="1" /> + <edge from-layer="6605" from-port="2" to-layer="6653" to-port="0" /> + <edge from-layer="6605" from-port="2" to-layer="6616" to-port="0" /> + <edge from-layer="6605" from-port="2" to-layer="6609" to-port="0" /> + <edge from-layer="6606" from-port="0" to-layer="6617" to-port="0" /> + <edge from-layer="6607" from-port="0" to-layer="6615" to-port="0" /> + <edge from-layer="6608" from-port="0" to-layer="6609" to-port="1" /> + <edge from-layer="6609" from-port="2" to-layer="6611" to-port="0" /> + <edge from-layer="6610" from-port="0" to-layer="6611" to-port="1" /> + <edge from-layer="6611" from-port="2" to-layer="6613" to-port="0" /> + <edge from-layer="6612" from-port="0" to-layer="6613" to-port="1" /> + <edge from-layer="6613" from-port="2" to-layer="6614" to-port="0" /> + <edge from-layer="6614" from-port="1" to-layer="6615" to-port="1" /> + <edge from-layer="6615" from-port="2" to-layer="6616" to-port="1" /> + <edge from-layer="6616" from-port="2" to-layer="6617" to-port="1" /> + <edge from-layer="6617" from-port="2" to-layer="6640" to-port="0" /> + <edge from-layer="6617" from-port="2" to-layer="6628" to-port="0" /> + <edge from-layer="6618" from-port="0" to-layer="6619" to-port="0" /> + <edge from-layer="6619" from-port="1" to-layer="6622" to-port="0" /> + <edge from-layer="6620" from-port="0" to-layer="6621" to-port="0" /> + <edge from-layer="6621" from-port="1" to-layer="6622" to-port="1" /> + <edge from-layer="6622" from-port="2" to-layer="6624" to-port="0" /> + <edge from-layer="6623" from-port="0" to-layer="6624" to-port="1" /> + <edge from-layer="6624" from-port="2" to-layer="6626" to-port="0" /> + <edge from-layer="6625" from-port="0" to-layer="6626" to-port="1" /> + <edge from-layer="6626" from-port="2" to-layer="6627" to-port="0" /> + <edge from-layer="6627" from-port="1" to-layer="6628" to-port="1" /> + <edge from-layer="6628" from-port="2" to-layer="6629" to-port="0" /> + <edge from-layer="6629" from-port="1" to-layer="6641" to-port="0" /> + <edge from-layer="6630" from-port="0" to-layer="6631" to-port="0" /> + <edge from-layer="6631" from-port="1" to-layer="6634" to-port="0" /> + <edge from-layer="6632" from-port="0" to-layer="6633" to-port="0" /> + <edge from-layer="6633" from-port="1" to-layer="6634" to-port="1" /> + <edge from-layer="6634" from-port="2" to-layer="6636" to-port="0" /> + <edge from-layer="6635" from-port="0" to-layer="6636" to-port="1" /> + <edge from-layer="6636" from-port="2" to-layer="6638" to-port="0" /> + <edge from-layer="6637" from-port="0" to-layer="6638" to-port="1" /> + <edge from-layer="6638" from-port="2" to-layer="6639" to-port="0" /> + <edge from-layer="6639" from-port="1" to-layer="6640" to-port="1" /> + <edge from-layer="6640" from-port="2" to-layer="6641" to-port="1" /> + <edge from-layer="6641" from-port="2" to-layer="6652" to-port="0" /> + <edge from-layer="6642" from-port="0" to-layer="6643" to-port="0" /> + <edge from-layer="6643" from-port="1" to-layer="6646" to-port="0" /> + <edge from-layer="6644" from-port="0" to-layer="6645" to-port="0" /> + <edge from-layer="6645" from-port="1" to-layer="6646" to-port="1" /> + <edge from-layer="6646" from-port="2" to-layer="6648" to-port="0" /> + <edge from-layer="6647" from-port="0" to-layer="6648" to-port="1" /> + <edge from-layer="6648" from-port="2" to-layer="6650" to-port="0" /> + <edge from-layer="6649" from-port="0" to-layer="6650" to-port="1" /> + <edge from-layer="6650" from-port="2" to-layer="6651" to-port="0" /> + <edge from-layer="6651" from-port="1" to-layer="6652" to-port="1" /> + <edge from-layer="6652" from-port="2" to-layer="6653" to-port="1" /> + <edge from-layer="6653" from-port="2" to-layer="6657" to-port="0" /> + <edge from-layer="6653" from-port="2" to-layer="6664" to-port="0" /> + <edge from-layer="6653" from-port="2" to-layer="6837" to-port="0" /> + <edge from-layer="6654" from-port="0" to-layer="6665" to-port="0" /> + <edge from-layer="6655" from-port="0" to-layer="6663" to-port="0" /> + <edge from-layer="6656" from-port="0" to-layer="6657" to-port="1" /> + <edge from-layer="6657" from-port="2" to-layer="6659" to-port="0" /> + <edge from-layer="6658" from-port="0" to-layer="6659" to-port="1" /> + <edge from-layer="6659" from-port="2" to-layer="6661" to-port="0" /> + <edge from-layer="6660" from-port="0" to-layer="6661" to-port="1" /> + <edge from-layer="6661" from-port="2" to-layer="6662" to-port="0" /> + <edge from-layer="6662" from-port="1" to-layer="6663" to-port="1" /> + <edge from-layer="6663" from-port="2" to-layer="6664" to-port="1" /> + <edge from-layer="6664" from-port="2" to-layer="6665" to-port="1" /> + <edge from-layer="6665" from-port="2" to-layer="6724" to-port="0" /> + <edge from-layer="6665" from-port="2" to-layer="6676" to-port="0" /> + <edge from-layer="6665" from-port="2" to-layer="6786" to-port="0" /> + <edge from-layer="6666" from-port="0" to-layer="6667" to-port="0" /> + <edge from-layer="6667" from-port="1" to-layer="6670" to-port="0" /> + <edge from-layer="6668" from-port="0" to-layer="6669" to-port="0" /> + <edge from-layer="6669" from-port="1" to-layer="6670" to-port="1" /> + <edge from-layer="6670" from-port="2" to-layer="6672" to-port="0" /> + <edge from-layer="6671" from-port="0" to-layer="6672" to-port="1" /> + <edge from-layer="6672" from-port="2" to-layer="6674" to-port="0" /> + <edge from-layer="6673" from-port="0" to-layer="6674" to-port="1" /> + <edge from-layer="6674" from-port="2" to-layer="6675" to-port="0" /> + <edge from-layer="6675" from-port="1" to-layer="6676" to-port="1" /> + <edge from-layer="6676" from-port="2" to-layer="6679" to-port="0" /> + <edge from-layer="6677" from-port="0" to-layer="6678" to-port="0" /> + <edge from-layer="6678" from-port="1" to-layer="6679" to-port="1" /> + <edge from-layer="6679" from-port="2" to-layer="6681" to-port="0" /> + <edge from-layer="6680" from-port="0" to-layer="6681" to-port="1" /> + <edge from-layer="6681" from-port="2" to-layer="6683" to-port="0" /> + <edge from-layer="6682" from-port="0" to-layer="6683" to-port="1" /> + <edge from-layer="6683" from-port="2" to-layer="6695" to-port="0" /> + <edge from-layer="6683" from-port="2" to-layer="6684" to-port="0" /> + <edge from-layer="6683" from-port="2" to-layer="6685" to-port="0" /> + <edge from-layer="6683" from-port="2" to-layer="6701" to-port="0" /> + <edge from-layer="6684" from-port="2" to-layer="6704" to-port="0" /> + <edge from-layer="6685" from-port="1" to-layer="6687" to-port="0" /> + <edge from-layer="6686" from-port="0" to-layer="6687" to-port="2" /> + <edge from-layer="6687" from-port="3" to-layer="6688" to-port="0" /> + <edge from-layer="6688" from-port="2" to-layer="6689" to-port="0" /> + <edge from-layer="6689" from-port="1" to-layer="6691" to-port="0" /> + <edge from-layer="6690" from-port="0" to-layer="6691" to-port="1" /> + <edge from-layer="6691" from-port="2" to-layer="6701" to-port="2" /> + <edge from-layer="6691" from-port="2" to-layer="6695" to-port="1" /> + <edge from-layer="6692" from-port="0" to-layer="6695" to-port="2" /> + <edge from-layer="6693" from-port="0" to-layer="6695" to-port="3" /> + <edge from-layer="6694" from-port="0" to-layer="6695" to-port="4" /> + <edge from-layer="6695" from-port="5" to-layer="6697" to-port="0" /> + <edge from-layer="6696" from-port="0" to-layer="6697" to-port="1" /> + <edge from-layer="6697" from-port="2" to-layer="6702" to-port="0" /> + <edge from-layer="6698" from-port="0" to-layer="6701" to-port="1" /> + <edge from-layer="6699" from-port="0" to-layer="6701" to-port="3" /> + <edge from-layer="6700" from-port="0" to-layer="6701" to-port="4" /> + <edge from-layer="6701" from-port="5" to-layer="6702" to-port="1" /> + <edge from-layer="6702" from-port="2" to-layer="6703" to-port="0" /> + <edge from-layer="6703" from-port="2" to-layer="6704" to-port="1" /> + <edge from-layer="6704" from-port="2" to-layer="6821" to-port="0" /> + <edge from-layer="6705" from-port="0" to-layer="6710" to-port="0" /> + <edge from-layer="6706" from-port="0" to-layer="6709" to-port="1" /> + <edge from-layer="6707" from-port="0" to-layer="6709" to-port="2" /> + <edge from-layer="6708" from-port="0" to-layer="6709" to-port="3" /> + <edge from-layer="6709" from-port="4" to-layer="6710" to-port="1" /> + <edge from-layer="6710" from-port="2" to-layer="6711" to-port="0" /> + <edge from-layer="6711" from-port="1" to-layer="6713" to-port="0" /> + <edge from-layer="6712" from-port="0" to-layer="6713" to-port="2" /> + <edge from-layer="6713" from-port="3" to-layer="6809" to-port="0" /> + <edge from-layer="6713" from-port="3" to-layer="6753" to-port="0" /> + <edge from-layer="6714" from-port="0" to-layer="6715" to-port="0" /> + <edge from-layer="6715" from-port="1" to-layer="6718" to-port="0" /> + <edge from-layer="6716" from-port="0" to-layer="6717" to-port="0" /> + <edge from-layer="6717" from-port="1" to-layer="6718" to-port="1" /> + <edge from-layer="6718" from-port="2" to-layer="6720" to-port="0" /> + <edge from-layer="6719" from-port="0" to-layer="6720" to-port="1" /> + <edge from-layer="6720" from-port="2" to-layer="6722" to-port="0" /> + <edge from-layer="6721" from-port="0" to-layer="6722" to-port="1" /> + <edge from-layer="6722" from-port="2" to-layer="6723" to-port="0" /> + <edge from-layer="6723" from-port="1" to-layer="6724" to-port="1" /> + <edge from-layer="6724" from-port="2" to-layer="6727" to-port="0" /> + <edge from-layer="6725" from-port="0" to-layer="6726" to-port="0" /> + <edge from-layer="6726" from-port="1" to-layer="6727" to-port="1" /> + <edge from-layer="6727" from-port="2" to-layer="6729" to-port="0" /> + <edge from-layer="6728" from-port="0" to-layer="6729" to-port="1" /> + <edge from-layer="6729" from-port="2" to-layer="6731" to-port="0" /> + <edge from-layer="6730" from-port="0" to-layer="6731" to-port="1" /> + <edge from-layer="6731" from-port="2" to-layer="6733" to-port="0" /> + <edge from-layer="6731" from-port="2" to-layer="6743" to-port="0" /> + <edge from-layer="6731" from-port="2" to-layer="6732" to-port="0" /> + <edge from-layer="6731" from-port="2" to-layer="6749" to-port="0" /> + <edge from-layer="6732" from-port="2" to-layer="6752" to-port="0" /> + <edge from-layer="6733" from-port="1" to-layer="6735" to-port="0" /> + <edge from-layer="6734" from-port="0" to-layer="6735" to-port="2" /> + <edge from-layer="6735" from-port="3" to-layer="6736" to-port="0" /> + <edge from-layer="6736" from-port="2" to-layer="6737" to-port="0" /> + <edge from-layer="6737" from-port="1" to-layer="6739" to-port="0" /> + <edge from-layer="6738" from-port="0" to-layer="6739" to-port="1" /> + <edge from-layer="6739" from-port="2" to-layer="6743" to-port="1" /> + <edge from-layer="6739" from-port="2" to-layer="6749" to-port="2" /> + <edge from-layer="6740" from-port="0" to-layer="6743" to-port="2" /> + <edge from-layer="6741" from-port="0" to-layer="6743" to-port="3" /> + <edge from-layer="6742" from-port="0" to-layer="6743" to-port="4" /> + <edge from-layer="6743" from-port="5" to-layer="6745" to-port="0" /> + <edge from-layer="6744" from-port="0" to-layer="6745" to-port="1" /> + <edge from-layer="6745" from-port="2" to-layer="6750" to-port="0" /> + <edge from-layer="6746" from-port="0" to-layer="6749" to-port="1" /> + <edge from-layer="6747" from-port="0" to-layer="6749" to-port="3" /> + <edge from-layer="6748" from-port="0" to-layer="6749" to-port="4" /> + <edge from-layer="6749" from-port="5" to-layer="6750" to-port="1" /> + <edge from-layer="6750" from-port="2" to-layer="6751" to-port="0" /> + <edge from-layer="6751" from-port="2" to-layer="6752" to-port="1" /> + <edge from-layer="6752" from-port="2" to-layer="6813" to-port="0" /> + <edge from-layer="6752" from-port="2" to-layer="6753" to-port="1" /> + <edge from-layer="6753" from-port="2" to-layer="6754" to-port="0" /> + <edge from-layer="6753" from-port="2" to-layer="6755" to-port="0" /> + <edge from-layer="6753" from-port="2" to-layer="11184" to-port="0" /> + <edge from-layer="6754" from-port="2" to-layer="6764" to-port="0" /> + <edge from-layer="6755" from-port="1" to-layer="6758" to-port="0" /> + <edge from-layer="6755" from-port="1" to-layer="6762" to-port="0" /> + <edge from-layer="6756" from-port="0" to-layer="6758" to-port="1" /> + <edge from-layer="6757" from-port="0" to-layer="6758" to-port="2" /> + <edge from-layer="6758" from-port="3" to-layer="6763" to-port="0" /> + <edge from-layer="6759" from-port="0" to-layer="6763" to-port="1" /> + <edge from-layer="6760" from-port="0" to-layer="6762" to-port="1" /> + <edge from-layer="6761" from-port="0" to-layer="6762" to-port="2" /> + <edge from-layer="6762" from-port="3" to-layer="6763" to-port="2" /> + <edge from-layer="6763" from-port="3" to-layer="6764" to-port="1" /> + <edge from-layer="6764" from-port="2" to-layer="6766" to-port="0" /> + <edge from-layer="6765" from-port="0" to-layer="6766" to-port="1" /> + <edge from-layer="6766" from-port="2" to-layer="6821" to-port="1" /> + <edge from-layer="6767" from-port="0" to-layer="6772" to-port="0" /> + <edge from-layer="6768" from-port="0" to-layer="6771" to-port="1" /> + <edge from-layer="6769" from-port="0" to-layer="6771" to-port="2" /> + <edge from-layer="6770" from-port="0" to-layer="6771" to-port="3" /> + <edge from-layer="6771" from-port="4" to-layer="6772" to-port="1" /> + <edge from-layer="6772" from-port="2" to-layer="6773" to-port="0" /> + <edge from-layer="6773" from-port="1" to-layer="6775" to-port="0" /> + <edge from-layer="6774" from-port="0" to-layer="6775" to-port="2" /> + <edge from-layer="6775" from-port="3" to-layer="6794" to-port="0" /> + <edge from-layer="6776" from-port="0" to-layer="6777" to-port="0" /> + <edge from-layer="6777" from-port="1" to-layer="6780" to-port="0" /> + <edge from-layer="6778" from-port="0" to-layer="6779" to-port="0" /> + <edge from-layer="6779" from-port="1" to-layer="6780" to-port="1" /> + <edge from-layer="6780" from-port="2" to-layer="6782" to-port="0" /> + <edge from-layer="6781" from-port="0" to-layer="6782" to-port="1" /> + <edge from-layer="6782" from-port="2" to-layer="6784" to-port="0" /> + <edge from-layer="6783" from-port="0" to-layer="6784" to-port="1" /> + <edge from-layer="6784" from-port="2" to-layer="6785" to-port="0" /> + <edge from-layer="6785" from-port="1" to-layer="6786" to-port="1" /> + <edge from-layer="6786" from-port="2" to-layer="6789" to-port="0" /> + <edge from-layer="6787" from-port="0" to-layer="6788" to-port="0" /> + <edge from-layer="6788" from-port="1" to-layer="6789" to-port="1" /> + <edge from-layer="6789" from-port="2" to-layer="6791" to-port="0" /> + <edge from-layer="6790" from-port="0" to-layer="6791" to-port="1" /> + <edge from-layer="6791" from-port="2" to-layer="6793" to-port="0" /> + <edge from-layer="6792" from-port="0" to-layer="6793" to-port="1" /> + <edge from-layer="6793" from-port="2" to-layer="6794" to-port="1" /> + <edge from-layer="6794" from-port="2" to-layer="6795" to-port="0" /> + <edge from-layer="6794" from-port="2" to-layer="6796" to-port="0" /> + <edge from-layer="6794" from-port="2" to-layer="11183" to-port="0" /> + <edge from-layer="6795" from-port="2" to-layer="6805" to-port="0" /> + <edge from-layer="6796" from-port="1" to-layer="6799" to-port="0" /> + <edge from-layer="6796" from-port="1" to-layer="6803" to-port="0" /> + <edge from-layer="6797" from-port="0" to-layer="6799" to-port="1" /> + <edge from-layer="6798" from-port="0" to-layer="6799" to-port="2" /> + <edge from-layer="6799" from-port="3" to-layer="6804" to-port="1" /> + <edge from-layer="6800" from-port="0" to-layer="6804" to-port="2" /> + <edge from-layer="6801" from-port="0" to-layer="6803" to-port="1" /> + <edge from-layer="6802" from-port="0" to-layer="6803" to-port="2" /> + <edge from-layer="6803" from-port="3" to-layer="6804" to-port="3" /> + <edge from-layer="6804" from-port="4" to-layer="6805" to-port="1" /> + <edge from-layer="6805" from-port="2" to-layer="6807" to-port="0" /> + <edge from-layer="6806" from-port="0" to-layer="6807" to-port="1" /> + <edge from-layer="6807" from-port="2" to-layer="6821" to-port="2" /> + <edge from-layer="6808" from-port="0" to-layer="6820" to-port="1" /> + <edge from-layer="6809" from-port="1" to-layer="6812" to-port="0" /> + <edge from-layer="6810" from-port="0" to-layer="6812" to-port="1" /> + <edge from-layer="6811" from-port="0" to-layer="6812" to-port="2" /> + <edge from-layer="6812" from-port="3" to-layer="6817" to-port="0" /> + <edge from-layer="6813" from-port="1" to-layer="6816" to-port="0" /> + <edge from-layer="6814" from-port="0" to-layer="6816" to-port="1" /> + <edge from-layer="6815" from-port="0" to-layer="6816" to-port="2" /> + <edge from-layer="6816" from-port="3" to-layer="6817" to-port="1" /> + <edge from-layer="6817" from-port="2" to-layer="6820" to-port="2" /> + <edge from-layer="6818" from-port="0" to-layer="6820" to-port="3" /> + <edge from-layer="6819" from-port="0" to-layer="6820" to-port="4" /> + <edge from-layer="6820" from-port="5" to-layer="6821" to-port="3" /> + <edge from-layer="6821" from-port="4" to-layer="6823" to-port="0" /> + <edge from-layer="6822" from-port="0" to-layer="6823" to-port="1" /> + <edge from-layer="6823" from-port="2" to-layer="6825" to-port="0" /> + <edge from-layer="6824" from-port="0" to-layer="6825" to-port="1" /> + <edge from-layer="6825" from-port="2" to-layer="6836" to-port="0" /> + <edge from-layer="6826" from-port="0" to-layer="6827" to-port="0" /> + <edge from-layer="6827" from-port="1" to-layer="6830" to-port="0" /> + <edge from-layer="6828" from-port="0" to-layer="6829" to-port="0" /> + <edge from-layer="6829" from-port="1" to-layer="6830" to-port="1" /> + <edge from-layer="6830" from-port="2" to-layer="6832" to-port="0" /> + <edge from-layer="6831" from-port="0" to-layer="6832" to-port="1" /> + <edge from-layer="6832" from-port="2" to-layer="6834" to-port="0" /> + <edge from-layer="6833" from-port="0" to-layer="6834" to-port="1" /> + <edge from-layer="6834" from-port="2" to-layer="6835" to-port="0" /> + <edge from-layer="6835" from-port="1" to-layer="6836" to-port="1" /> + <edge from-layer="6836" from-port="2" to-layer="6837" to-port="1" /> + <edge from-layer="6837" from-port="2" to-layer="6841" to-port="0" /> + <edge from-layer="6837" from-port="2" to-layer="6885" to-port="0" /> + <edge from-layer="6837" from-port="2" to-layer="6848" to-port="0" /> + <edge from-layer="6838" from-port="0" to-layer="6849" to-port="0" /> + <edge from-layer="6839" from-port="0" to-layer="6847" to-port="0" /> + <edge from-layer="6840" from-port="0" to-layer="6841" to-port="1" /> + <edge from-layer="6841" from-port="2" to-layer="6843" to-port="0" /> + <edge from-layer="6842" from-port="0" to-layer="6843" to-port="1" /> + <edge from-layer="6843" from-port="2" to-layer="6845" to-port="0" /> + <edge from-layer="6844" from-port="0" to-layer="6845" to-port="1" /> + <edge from-layer="6845" from-port="2" to-layer="6846" to-port="0" /> + <edge from-layer="6846" from-port="1" to-layer="6847" to-port="1" /> + <edge from-layer="6847" from-port="2" to-layer="6848" to-port="1" /> + <edge from-layer="6848" from-port="2" to-layer="6849" to-port="1" /> + <edge from-layer="6849" from-port="2" to-layer="6872" to-port="0" /> + <edge from-layer="6849" from-port="2" to-layer="6860" to-port="0" /> + <edge from-layer="6850" from-port="0" to-layer="6851" to-port="0" /> + <edge from-layer="6851" from-port="1" to-layer="6854" to-port="0" /> + <edge from-layer="6852" from-port="0" to-layer="6853" to-port="0" /> + <edge from-layer="6853" from-port="1" to-layer="6854" to-port="1" /> + <edge from-layer="6854" from-port="2" to-layer="6856" to-port="0" /> + <edge from-layer="6855" from-port="0" to-layer="6856" to-port="1" /> + <edge from-layer="6856" from-port="2" to-layer="6858" to-port="0" /> + <edge from-layer="6857" from-port="0" to-layer="6858" to-port="1" /> + <edge from-layer="6858" from-port="2" to-layer="6859" to-port="0" /> + <edge from-layer="6859" from-port="1" to-layer="6860" to-port="1" /> + <edge from-layer="6860" from-port="2" to-layer="6861" to-port="0" /> + <edge from-layer="6861" from-port="1" to-layer="6873" to-port="0" /> + <edge from-layer="6862" from-port="0" to-layer="6863" to-port="0" /> + <edge from-layer="6863" from-port="1" to-layer="6866" to-port="0" /> + <edge from-layer="6864" from-port="0" to-layer="6865" to-port="0" /> + <edge from-layer="6865" from-port="1" to-layer="6866" to-port="1" /> + <edge from-layer="6866" from-port="2" to-layer="6868" to-port="0" /> + <edge from-layer="6867" from-port="0" to-layer="6868" to-port="1" /> + <edge from-layer="6868" from-port="2" to-layer="6870" to-port="0" /> + <edge from-layer="6869" from-port="0" to-layer="6870" to-port="1" /> + <edge from-layer="6870" from-port="2" to-layer="6871" to-port="0" /> + <edge from-layer="6871" from-port="1" to-layer="6872" to-port="1" /> + <edge from-layer="6872" from-port="2" to-layer="6873" to-port="1" /> + <edge from-layer="6873" from-port="2" to-layer="6884" to-port="0" /> + <edge from-layer="6874" from-port="0" to-layer="6875" to-port="0" /> + <edge from-layer="6875" from-port="1" to-layer="6878" to-port="0" /> + <edge from-layer="6876" from-port="0" to-layer="6877" to-port="0" /> + <edge from-layer="6877" from-port="1" to-layer="6878" to-port="1" /> + <edge from-layer="6878" from-port="2" to-layer="6880" to-port="0" /> + <edge from-layer="6879" from-port="0" to-layer="6880" to-port="1" /> + <edge from-layer="6880" from-port="2" to-layer="6882" to-port="0" /> + <edge from-layer="6881" from-port="0" to-layer="6882" to-port="1" /> + <edge from-layer="6882" from-port="2" to-layer="6883" to-port="0" /> + <edge from-layer="6883" from-port="1" to-layer="6884" to-port="1" /> + <edge from-layer="6884" from-port="2" to-layer="6885" to-port="1" /> + <edge from-layer="6885" from-port="2" to-layer="6896" to-port="0" /> + <edge from-layer="6885" from-port="2" to-layer="6889" to-port="0" /> + <edge from-layer="6885" from-port="2" to-layer="7069" to-port="0" /> + <edge from-layer="6886" from-port="0" to-layer="6897" to-port="0" /> + <edge from-layer="6887" from-port="0" to-layer="6895" to-port="0" /> + <edge from-layer="6888" from-port="0" to-layer="6889" to-port="1" /> + <edge from-layer="6889" from-port="2" to-layer="6891" to-port="0" /> + <edge from-layer="6890" from-port="0" to-layer="6891" to-port="1" /> + <edge from-layer="6891" from-port="2" to-layer="6893" to-port="0" /> + <edge from-layer="6892" from-port="0" to-layer="6893" to-port="1" /> + <edge from-layer="6893" from-port="2" to-layer="6894" to-port="0" /> + <edge from-layer="6894" from-port="1" to-layer="6895" to-port="1" /> + <edge from-layer="6895" from-port="2" to-layer="6896" to-port="1" /> + <edge from-layer="6896" from-port="2" to-layer="6897" to-port="1" /> + <edge from-layer="6897" from-port="2" to-layer="6908" to-port="0" /> + <edge from-layer="6897" from-port="2" to-layer="7018" to-port="0" /> + <edge from-layer="6897" from-port="2" to-layer="6956" to-port="0" /> + <edge from-layer="6898" from-port="0" to-layer="6899" to-port="0" /> + <edge from-layer="6899" from-port="1" to-layer="6902" to-port="0" /> + <edge from-layer="6900" from-port="0" to-layer="6901" to-port="0" /> + <edge from-layer="6901" from-port="1" to-layer="6902" to-port="1" /> + <edge from-layer="6902" from-port="2" to-layer="6904" to-port="0" /> + <edge from-layer="6903" from-port="0" to-layer="6904" to-port="1" /> + <edge from-layer="6904" from-port="2" to-layer="6906" to-port="0" /> + <edge from-layer="6905" from-port="0" to-layer="6906" to-port="1" /> + <edge from-layer="6906" from-port="2" to-layer="6907" to-port="0" /> + <edge from-layer="6907" from-port="1" to-layer="6908" to-port="1" /> + <edge from-layer="6908" from-port="2" to-layer="6911" to-port="0" /> + <edge from-layer="6909" from-port="0" to-layer="6910" to-port="0" /> + <edge from-layer="6910" from-port="1" to-layer="6911" to-port="1" /> + <edge from-layer="6911" from-port="2" to-layer="6913" to-port="0" /> + <edge from-layer="6912" from-port="0" to-layer="6913" to-port="1" /> + <edge from-layer="6913" from-port="2" to-layer="6915" to-port="0" /> + <edge from-layer="6914" from-port="0" to-layer="6915" to-port="1" /> + <edge from-layer="6915" from-port="2" to-layer="6917" to-port="0" /> + <edge from-layer="6915" from-port="2" to-layer="6933" to-port="0" /> + <edge from-layer="6915" from-port="2" to-layer="6916" to-port="0" /> + <edge from-layer="6915" from-port="2" to-layer="6927" to-port="0" /> + <edge from-layer="6916" from-port="2" to-layer="6936" to-port="0" /> + <edge from-layer="6917" from-port="1" to-layer="6919" to-port="0" /> + <edge from-layer="6918" from-port="0" to-layer="6919" to-port="2" /> + <edge from-layer="6919" from-port="3" to-layer="6920" to-port="0" /> + <edge from-layer="6920" from-port="2" to-layer="6921" to-port="0" /> + <edge from-layer="6921" from-port="1" to-layer="6923" to-port="0" /> + <edge from-layer="6922" from-port="0" to-layer="6923" to-port="1" /> + <edge from-layer="6923" from-port="2" to-layer="6933" to-port="2" /> + <edge from-layer="6923" from-port="2" to-layer="6927" to-port="1" /> + <edge from-layer="6924" from-port="0" to-layer="6927" to-port="2" /> + <edge from-layer="6925" from-port="0" to-layer="6927" to-port="3" /> + <edge from-layer="6926" from-port="0" to-layer="6927" to-port="4" /> + <edge from-layer="6927" from-port="5" to-layer="6929" to-port="0" /> + <edge from-layer="6928" from-port="0" to-layer="6929" to-port="1" /> + <edge from-layer="6929" from-port="2" to-layer="6934" to-port="0" /> + <edge from-layer="6930" from-port="0" to-layer="6933" to-port="1" /> + <edge from-layer="6931" from-port="0" to-layer="6933" to-port="3" /> + <edge from-layer="6932" from-port="0" to-layer="6933" to-port="4" /> + <edge from-layer="6933" from-port="5" to-layer="6934" to-port="1" /> + <edge from-layer="6934" from-port="2" to-layer="6935" to-port="0" /> + <edge from-layer="6935" from-port="2" to-layer="6936" to-port="1" /> + <edge from-layer="6936" from-port="2" to-layer="7053" to-port="0" /> + <edge from-layer="6937" from-port="0" to-layer="6942" to-port="0" /> + <edge from-layer="6938" from-port="0" to-layer="6941" to-port="1" /> + <edge from-layer="6939" from-port="0" to-layer="6941" to-port="2" /> + <edge from-layer="6940" from-port="0" to-layer="6941" to-port="3" /> + <edge from-layer="6941" from-port="4" to-layer="6942" to-port="1" /> + <edge from-layer="6942" from-port="2" to-layer="6943" to-port="0" /> + <edge from-layer="6943" from-port="1" to-layer="6945" to-port="0" /> + <edge from-layer="6944" from-port="0" to-layer="6945" to-port="2" /> + <edge from-layer="6945" from-port="3" to-layer="7041" to-port="0" /> + <edge from-layer="6945" from-port="3" to-layer="6985" to-port="0" /> + <edge from-layer="6946" from-port="0" to-layer="6947" to-port="0" /> + <edge from-layer="6947" from-port="1" to-layer="6950" to-port="0" /> + <edge from-layer="6948" from-port="0" to-layer="6949" to-port="0" /> + <edge from-layer="6949" from-port="1" to-layer="6950" to-port="1" /> + <edge from-layer="6950" from-port="2" to-layer="6952" to-port="0" /> + <edge from-layer="6951" from-port="0" to-layer="6952" to-port="1" /> + <edge from-layer="6952" from-port="2" to-layer="6954" to-port="0" /> + <edge from-layer="6953" from-port="0" to-layer="6954" to-port="1" /> + <edge from-layer="6954" from-port="2" to-layer="6955" to-port="0" /> + <edge from-layer="6955" from-port="1" to-layer="6956" to-port="1" /> + <edge from-layer="6956" from-port="2" to-layer="6959" to-port="0" /> + <edge from-layer="6957" from-port="0" to-layer="6958" to-port="0" /> + <edge from-layer="6958" from-port="1" to-layer="6959" to-port="1" /> + <edge from-layer="6959" from-port="2" to-layer="6961" to-port="0" /> + <edge from-layer="6960" from-port="0" to-layer="6961" to-port="1" /> + <edge from-layer="6961" from-port="2" to-layer="6963" to-port="0" /> + <edge from-layer="6962" from-port="0" to-layer="6963" to-port="1" /> + <edge from-layer="6963" from-port="2" to-layer="6981" to-port="0" /> + <edge from-layer="6963" from-port="2" to-layer="6975" to-port="0" /> + <edge from-layer="6963" from-port="2" to-layer="6964" to-port="0" /> + <edge from-layer="6963" from-port="2" to-layer="6965" to-port="0" /> + <edge from-layer="6964" from-port="2" to-layer="6984" to-port="0" /> + <edge from-layer="6965" from-port="1" to-layer="6967" to-port="0" /> + <edge from-layer="6966" from-port="0" to-layer="6967" to-port="2" /> + <edge from-layer="6967" from-port="3" to-layer="6968" to-port="0" /> + <edge from-layer="6968" from-port="2" to-layer="6969" to-port="0" /> + <edge from-layer="6969" from-port="1" to-layer="6971" to-port="0" /> + <edge from-layer="6970" from-port="0" to-layer="6971" to-port="1" /> + <edge from-layer="6971" from-port="2" to-layer="6975" to-port="1" /> + <edge from-layer="6971" from-port="2" to-layer="6981" to-port="2" /> + <edge from-layer="6972" from-port="0" to-layer="6975" to-port="2" /> + <edge from-layer="6973" from-port="0" to-layer="6975" to-port="3" /> + <edge from-layer="6974" from-port="0" to-layer="6975" to-port="4" /> + <edge from-layer="6975" from-port="5" to-layer="6977" to-port="0" /> + <edge from-layer="6976" from-port="0" to-layer="6977" to-port="1" /> + <edge from-layer="6977" from-port="2" to-layer="6982" to-port="0" /> + <edge from-layer="6978" from-port="0" to-layer="6981" to-port="1" /> + <edge from-layer="6979" from-port="0" to-layer="6981" to-port="3" /> + <edge from-layer="6980" from-port="0" to-layer="6981" to-port="4" /> + <edge from-layer="6981" from-port="5" to-layer="6982" to-port="1" /> + <edge from-layer="6982" from-port="2" to-layer="6983" to-port="0" /> + <edge from-layer="6983" from-port="2" to-layer="6984" to-port="1" /> + <edge from-layer="6984" from-port="2" to-layer="6985" to-port="1" /> + <edge from-layer="6984" from-port="2" to-layer="7045" to-port="0" /> + <edge from-layer="6985" from-port="2" to-layer="6987" to-port="0" /> + <edge from-layer="6985" from-port="2" to-layer="11182" to-port="0" /> + <edge from-layer="6985" from-port="2" to-layer="6986" to-port="0" /> + <edge from-layer="6986" from-port="2" to-layer="6996" to-port="0" /> + <edge from-layer="6987" from-port="1" to-layer="6990" to-port="0" /> + <edge from-layer="6987" from-port="1" to-layer="6994" to-port="0" /> + <edge from-layer="6988" from-port="0" to-layer="6990" to-port="1" /> + <edge from-layer="6989" from-port="0" to-layer="6990" to-port="2" /> + <edge from-layer="6990" from-port="3" to-layer="6995" to-port="0" /> + <edge from-layer="6991" from-port="0" to-layer="6995" to-port="1" /> + <edge from-layer="6992" from-port="0" to-layer="6994" to-port="1" /> + <edge from-layer="6993" from-port="0" to-layer="6994" to-port="2" /> + <edge from-layer="6994" from-port="3" to-layer="6995" to-port="2" /> + <edge from-layer="6995" from-port="3" to-layer="6996" to-port="1" /> + <edge from-layer="6996" from-port="2" to-layer="6998" to-port="0" /> + <edge from-layer="6997" from-port="0" to-layer="6998" to-port="1" /> + <edge from-layer="6998" from-port="2" to-layer="7053" to-port="1" /> + <edge from-layer="6999" from-port="0" to-layer="7004" to-port="0" /> + <edge from-layer="7000" from-port="0" to-layer="7003" to-port="1" /> + <edge from-layer="7001" from-port="0" to-layer="7003" to-port="2" /> + <edge from-layer="7002" from-port="0" to-layer="7003" to-port="3" /> + <edge from-layer="7003" from-port="4" to-layer="7004" to-port="1" /> + <edge from-layer="7004" from-port="2" to-layer="7005" to-port="0" /> + <edge from-layer="7005" from-port="1" to-layer="7007" to-port="0" /> + <edge from-layer="7006" from-port="0" to-layer="7007" to-port="2" /> + <edge from-layer="7007" from-port="3" to-layer="7026" to-port="0" /> + <edge from-layer="7008" from-port="0" to-layer="7009" to-port="0" /> + <edge from-layer="7009" from-port="1" to-layer="7012" to-port="0" /> + <edge from-layer="7010" from-port="0" to-layer="7011" to-port="0" /> + <edge from-layer="7011" from-port="1" to-layer="7012" to-port="1" /> + <edge from-layer="7012" from-port="2" to-layer="7014" to-port="0" /> + <edge from-layer="7013" from-port="0" to-layer="7014" to-port="1" /> + <edge from-layer="7014" from-port="2" to-layer="7016" to-port="0" /> + <edge from-layer="7015" from-port="0" to-layer="7016" to-port="1" /> + <edge from-layer="7016" from-port="2" to-layer="7017" to-port="0" /> + <edge from-layer="7017" from-port="1" to-layer="7018" to-port="1" /> + <edge from-layer="7018" from-port="2" to-layer="7021" to-port="0" /> + <edge from-layer="7019" from-port="0" to-layer="7020" to-port="0" /> + <edge from-layer="7020" from-port="1" to-layer="7021" to-port="1" /> + <edge from-layer="7021" from-port="2" to-layer="7023" to-port="0" /> + <edge from-layer="7022" from-port="0" to-layer="7023" to-port="1" /> + <edge from-layer="7023" from-port="2" to-layer="7025" to-port="0" /> + <edge from-layer="7024" from-port="0" to-layer="7025" to-port="1" /> + <edge from-layer="7025" from-port="2" to-layer="7026" to-port="1" /> + <edge from-layer="7026" from-port="2" to-layer="7027" to-port="0" /> + <edge from-layer="7026" from-port="2" to-layer="11181" to-port="0" /> + <edge from-layer="7026" from-port="2" to-layer="7028" to-port="0" /> + <edge from-layer="7027" from-port="2" to-layer="7037" to-port="0" /> + <edge from-layer="7028" from-port="1" to-layer="7035" to-port="0" /> + <edge from-layer="7028" from-port="1" to-layer="7031" to-port="0" /> + <edge from-layer="7029" from-port="0" to-layer="7031" to-port="1" /> + <edge from-layer="7030" from-port="0" to-layer="7031" to-port="2" /> + <edge from-layer="7031" from-port="3" to-layer="7036" to-port="1" /> + <edge from-layer="7032" from-port="0" to-layer="7036" to-port="2" /> + <edge from-layer="7033" from-port="0" to-layer="7035" to-port="1" /> + <edge from-layer="7034" from-port="0" to-layer="7035" to-port="2" /> + <edge from-layer="7035" from-port="3" to-layer="7036" to-port="3" /> + <edge from-layer="7036" from-port="4" to-layer="7037" to-port="1" /> + <edge from-layer="7037" from-port="2" to-layer="7039" to-port="0" /> + <edge from-layer="7038" from-port="0" to-layer="7039" to-port="1" /> + <edge from-layer="7039" from-port="2" to-layer="7053" to-port="2" /> + <edge from-layer="7040" from-port="0" to-layer="7052" to-port="1" /> + <edge from-layer="7041" from-port="1" to-layer="7044" to-port="0" /> + <edge from-layer="7042" from-port="0" to-layer="7044" to-port="1" /> + <edge from-layer="7043" from-port="0" to-layer="7044" to-port="2" /> + <edge from-layer="7044" from-port="3" to-layer="7049" to-port="0" /> + <edge from-layer="7045" from-port="1" to-layer="7048" to-port="0" /> + <edge from-layer="7046" from-port="0" to-layer="7048" to-port="1" /> + <edge from-layer="7047" from-port="0" to-layer="7048" to-port="2" /> + <edge from-layer="7048" from-port="3" to-layer="7049" to-port="1" /> + <edge from-layer="7049" from-port="2" to-layer="7052" to-port="2" /> + <edge from-layer="7050" from-port="0" to-layer="7052" to-port="3" /> + <edge from-layer="7051" from-port="0" to-layer="7052" to-port="4" /> + <edge from-layer="7052" from-port="5" to-layer="7053" to-port="3" /> + <edge from-layer="7053" from-port="4" to-layer="7055" to-port="0" /> + <edge from-layer="7054" from-port="0" to-layer="7055" to-port="1" /> + <edge from-layer="7055" from-port="2" to-layer="7057" to-port="0" /> + <edge from-layer="7056" from-port="0" to-layer="7057" to-port="1" /> + <edge from-layer="7057" from-port="2" to-layer="7068" to-port="0" /> + <edge from-layer="7058" from-port="0" to-layer="7059" to-port="0" /> + <edge from-layer="7059" from-port="1" to-layer="7062" to-port="0" /> + <edge from-layer="7060" from-port="0" to-layer="7061" to-port="0" /> + <edge from-layer="7061" from-port="1" to-layer="7062" to-port="1" /> + <edge from-layer="7062" from-port="2" to-layer="7064" to-port="0" /> + <edge from-layer="7063" from-port="0" to-layer="7064" to-port="1" /> + <edge from-layer="7064" from-port="2" to-layer="7066" to-port="0" /> + <edge from-layer="7065" from-port="0" to-layer="7066" to-port="1" /> + <edge from-layer="7066" from-port="2" to-layer="7067" to-port="0" /> + <edge from-layer="7067" from-port="1" to-layer="7068" to-port="1" /> + <edge from-layer="7068" from-port="2" to-layer="7069" to-port="1" /> + <edge from-layer="7069" from-port="2" to-layer="7117" to-port="0" /> + <edge from-layer="7069" from-port="2" to-layer="7073" to-port="0" /> + <edge from-layer="7069" from-port="2" to-layer="7080" to-port="0" /> + <edge from-layer="7070" from-port="0" to-layer="7081" to-port="0" /> + <edge from-layer="7071" from-port="0" to-layer="7079" to-port="0" /> + <edge from-layer="7072" from-port="0" to-layer="7073" to-port="1" /> + <edge from-layer="7073" from-port="2" to-layer="7075" to-port="0" /> + <edge from-layer="7074" from-port="0" to-layer="7075" to-port="1" /> + <edge from-layer="7075" from-port="2" to-layer="7077" to-port="0" /> + <edge from-layer="7076" from-port="0" to-layer="7077" to-port="1" /> + <edge from-layer="7077" from-port="2" to-layer="7078" to-port="0" /> + <edge from-layer="7078" from-port="1" to-layer="7079" to-port="1" /> + <edge from-layer="7079" from-port="2" to-layer="7080" to-port="1" /> + <edge from-layer="7080" from-port="2" to-layer="7081" to-port="1" /> + <edge from-layer="7081" from-port="2" to-layer="7104" to-port="0" /> + <edge from-layer="7081" from-port="2" to-layer="7092" to-port="0" /> + <edge from-layer="7082" from-port="0" to-layer="7083" to-port="0" /> + <edge from-layer="7083" from-port="1" to-layer="7086" to-port="0" /> + <edge from-layer="7084" from-port="0" to-layer="7085" to-port="0" /> + <edge from-layer="7085" from-port="1" to-layer="7086" to-port="1" /> + <edge from-layer="7086" from-port="2" to-layer="7088" to-port="0" /> + <edge from-layer="7087" from-port="0" to-layer="7088" to-port="1" /> + <edge from-layer="7088" from-port="2" to-layer="7090" to-port="0" /> + <edge from-layer="7089" from-port="0" to-layer="7090" to-port="1" /> + <edge from-layer="7090" from-port="2" to-layer="7091" to-port="0" /> + <edge from-layer="7091" from-port="1" to-layer="7092" to-port="1" /> + <edge from-layer="7092" from-port="2" to-layer="7093" to-port="0" /> + <edge from-layer="7093" from-port="1" to-layer="7105" to-port="0" /> + <edge from-layer="7094" from-port="0" to-layer="7095" to-port="0" /> + <edge from-layer="7095" from-port="1" to-layer="7098" to-port="0" /> + <edge from-layer="7096" from-port="0" to-layer="7097" to-port="0" /> + <edge from-layer="7097" from-port="1" to-layer="7098" to-port="1" /> + <edge from-layer="7098" from-port="2" to-layer="7100" to-port="0" /> + <edge from-layer="7099" from-port="0" to-layer="7100" to-port="1" /> + <edge from-layer="7100" from-port="2" to-layer="7102" to-port="0" /> + <edge from-layer="7101" from-port="0" to-layer="7102" to-port="1" /> + <edge from-layer="7102" from-port="2" to-layer="7103" to-port="0" /> + <edge from-layer="7103" from-port="1" to-layer="7104" to-port="1" /> + <edge from-layer="7104" from-port="2" to-layer="7105" to-port="1" /> + <edge from-layer="7105" from-port="2" to-layer="7116" to-port="0" /> + <edge from-layer="7106" from-port="0" to-layer="7107" to-port="0" /> + <edge from-layer="7107" from-port="1" to-layer="7110" to-port="0" /> + <edge from-layer="7108" from-port="0" to-layer="7109" to-port="0" /> + <edge from-layer="7109" from-port="1" to-layer="7110" to-port="1" /> + <edge from-layer="7110" from-port="2" to-layer="7112" to-port="0" /> + <edge from-layer="7111" from-port="0" to-layer="7112" to-port="1" /> + <edge from-layer="7112" from-port="2" to-layer="7114" to-port="0" /> + <edge from-layer="7113" from-port="0" to-layer="7114" to-port="1" /> + <edge from-layer="7114" from-port="2" to-layer="7115" to-port="0" /> + <edge from-layer="7115" from-port="1" to-layer="7116" to-port="1" /> + <edge from-layer="7116" from-port="2" to-layer="7117" to-port="1" /> + <edge from-layer="7117" from-port="2" to-layer="7128" to-port="0" /> + <edge from-layer="7117" from-port="2" to-layer="7121" to-port="0" /> + <edge from-layer="7117" from-port="2" to-layer="7301" to-port="0" /> + <edge from-layer="7118" from-port="0" to-layer="7129" to-port="0" /> + <edge from-layer="7119" from-port="0" to-layer="7127" to-port="0" /> + <edge from-layer="7120" from-port="0" to-layer="7121" to-port="1" /> + <edge from-layer="7121" from-port="2" to-layer="7123" to-port="0" /> + <edge from-layer="7122" from-port="0" to-layer="7123" to-port="1" /> + <edge from-layer="7123" from-port="2" to-layer="7125" to-port="0" /> + <edge from-layer="7124" from-port="0" to-layer="7125" to-port="1" /> + <edge from-layer="7125" from-port="2" to-layer="7126" to-port="0" /> + <edge from-layer="7126" from-port="1" to-layer="7127" to-port="1" /> + <edge from-layer="7127" from-port="2" to-layer="7128" to-port="1" /> + <edge from-layer="7128" from-port="2" to-layer="7129" to-port="1" /> + <edge from-layer="7129" from-port="2" to-layer="7188" to-port="0" /> + <edge from-layer="7129" from-port="2" to-layer="7250" to-port="0" /> + <edge from-layer="7129" from-port="2" to-layer="7140" to-port="0" /> + <edge from-layer="7130" from-port="0" to-layer="7131" to-port="0" /> + <edge from-layer="7131" from-port="1" to-layer="7134" to-port="0" /> + <edge from-layer="7132" from-port="0" to-layer="7133" to-port="0" /> + <edge from-layer="7133" from-port="1" to-layer="7134" to-port="1" /> + <edge from-layer="7134" from-port="2" to-layer="7136" to-port="0" /> + <edge from-layer="7135" from-port="0" to-layer="7136" to-port="1" /> + <edge from-layer="7136" from-port="2" to-layer="7138" to-port="0" /> + <edge from-layer="7137" from-port="0" to-layer="7138" to-port="1" /> + <edge from-layer="7138" from-port="2" to-layer="7139" to-port="0" /> + <edge from-layer="7139" from-port="1" to-layer="7140" to-port="1" /> + <edge from-layer="7140" from-port="2" to-layer="7143" to-port="0" /> + <edge from-layer="7141" from-port="0" to-layer="7142" to-port="0" /> + <edge from-layer="7142" from-port="1" to-layer="7143" to-port="1" /> + <edge from-layer="7143" from-port="2" to-layer="7145" to-port="0" /> + <edge from-layer="7144" from-port="0" to-layer="7145" to-port="1" /> + <edge from-layer="7145" from-port="2" to-layer="7147" to-port="0" /> + <edge from-layer="7146" from-port="0" to-layer="7147" to-port="1" /> + <edge from-layer="7147" from-port="2" to-layer="7148" to-port="0" /> + <edge from-layer="7147" from-port="2" to-layer="7149" to-port="0" /> + <edge from-layer="7147" from-port="2" to-layer="7159" to-port="0" /> + <edge from-layer="7147" from-port="2" to-layer="7165" to-port="0" /> + <edge from-layer="7148" from-port="2" to-layer="7168" to-port="0" /> + <edge from-layer="7149" from-port="1" to-layer="7151" to-port="0" /> + <edge from-layer="7150" from-port="0" to-layer="7151" to-port="2" /> + <edge from-layer="7151" from-port="3" to-layer="7152" to-port="0" /> + <edge from-layer="7152" from-port="2" to-layer="7153" to-port="0" /> + <edge from-layer="7153" from-port="1" to-layer="7155" to-port="0" /> + <edge from-layer="7154" from-port="0" to-layer="7155" to-port="1" /> + <edge from-layer="7155" from-port="2" to-layer="7159" to-port="1" /> + <edge from-layer="7155" from-port="2" to-layer="7165" to-port="2" /> + <edge from-layer="7156" from-port="0" to-layer="7159" to-port="2" /> + <edge from-layer="7157" from-port="0" to-layer="7159" to-port="3" /> + <edge from-layer="7158" from-port="0" to-layer="7159" to-port="4" /> + <edge from-layer="7159" from-port="5" to-layer="7161" to-port="0" /> + <edge from-layer="7160" from-port="0" to-layer="7161" to-port="1" /> + <edge from-layer="7161" from-port="2" to-layer="7166" to-port="0" /> + <edge from-layer="7162" from-port="0" to-layer="7165" to-port="1" /> + <edge from-layer="7163" from-port="0" to-layer="7165" to-port="3" /> + <edge from-layer="7164" from-port="0" to-layer="7165" to-port="4" /> + <edge from-layer="7165" from-port="5" to-layer="7166" to-port="1" /> + <edge from-layer="7166" from-port="2" to-layer="7167" to-port="0" /> + <edge from-layer="7167" from-port="2" to-layer="7168" to-port="1" /> + <edge from-layer="7168" from-port="2" to-layer="7285" to-port="0" /> + <edge from-layer="7169" from-port="0" to-layer="7174" to-port="0" /> + <edge from-layer="7170" from-port="0" to-layer="7173" to-port="1" /> + <edge from-layer="7171" from-port="0" to-layer="7173" to-port="2" /> + <edge from-layer="7172" from-port="0" to-layer="7173" to-port="3" /> + <edge from-layer="7173" from-port="4" to-layer="7174" to-port="1" /> + <edge from-layer="7174" from-port="2" to-layer="7175" to-port="0" /> + <edge from-layer="7175" from-port="1" to-layer="7177" to-port="0" /> + <edge from-layer="7176" from-port="0" to-layer="7177" to-port="2" /> + <edge from-layer="7177" from-port="3" to-layer="7273" to-port="0" /> + <edge from-layer="7177" from-port="3" to-layer="7217" to-port="0" /> + <edge from-layer="7178" from-port="0" to-layer="7179" to-port="0" /> + <edge from-layer="7179" from-port="1" to-layer="7182" to-port="0" /> + <edge from-layer="7180" from-port="0" to-layer="7181" to-port="0" /> + <edge from-layer="7181" from-port="1" to-layer="7182" to-port="1" /> + <edge from-layer="7182" from-port="2" to-layer="7184" to-port="0" /> + <edge from-layer="7183" from-port="0" to-layer="7184" to-port="1" /> + <edge from-layer="7184" from-port="2" to-layer="7186" to-port="0" /> + <edge from-layer="7185" from-port="0" to-layer="7186" to-port="1" /> + <edge from-layer="7186" from-port="2" to-layer="7187" to-port="0" /> + <edge from-layer="7187" from-port="1" to-layer="7188" to-port="1" /> + <edge from-layer="7188" from-port="2" to-layer="7191" to-port="0" /> + <edge from-layer="7189" from-port="0" to-layer="7190" to-port="0" /> + <edge from-layer="7190" from-port="1" to-layer="7191" to-port="1" /> + <edge from-layer="7191" from-port="2" to-layer="7193" to-port="0" /> + <edge from-layer="7192" from-port="0" to-layer="7193" to-port="1" /> + <edge from-layer="7193" from-port="2" to-layer="7195" to-port="0" /> + <edge from-layer="7194" from-port="0" to-layer="7195" to-port="1" /> + <edge from-layer="7195" from-port="2" to-layer="7197" to-port="0" /> + <edge from-layer="7195" from-port="2" to-layer="7196" to-port="0" /> + <edge from-layer="7195" from-port="2" to-layer="7213" to-port="0" /> + <edge from-layer="7195" from-port="2" to-layer="7207" to-port="0" /> + <edge from-layer="7196" from-port="2" to-layer="7216" to-port="0" /> + <edge from-layer="7197" from-port="1" to-layer="7199" to-port="0" /> + <edge from-layer="7198" from-port="0" to-layer="7199" to-port="2" /> + <edge from-layer="7199" from-port="3" to-layer="7200" to-port="0" /> + <edge from-layer="7200" from-port="2" to-layer="7201" to-port="0" /> + <edge from-layer="7201" from-port="1" to-layer="7203" to-port="0" /> + <edge from-layer="7202" from-port="0" to-layer="7203" to-port="1" /> + <edge from-layer="7203" from-port="2" to-layer="7213" to-port="2" /> + <edge from-layer="7203" from-port="2" to-layer="7207" to-port="1" /> + <edge from-layer="7204" from-port="0" to-layer="7207" to-port="2" /> + <edge from-layer="7205" from-port="0" to-layer="7207" to-port="3" /> + <edge from-layer="7206" from-port="0" to-layer="7207" to-port="4" /> + <edge from-layer="7207" from-port="5" to-layer="7209" to-port="0" /> + <edge from-layer="7208" from-port="0" to-layer="7209" to-port="1" /> + <edge from-layer="7209" from-port="2" to-layer="7214" to-port="0" /> + <edge from-layer="7210" from-port="0" to-layer="7213" to-port="1" /> + <edge from-layer="7211" from-port="0" to-layer="7213" to-port="3" /> + <edge from-layer="7212" from-port="0" to-layer="7213" to-port="4" /> + <edge from-layer="7213" from-port="5" to-layer="7214" to-port="1" /> + <edge from-layer="7214" from-port="2" to-layer="7215" to-port="0" /> + <edge from-layer="7215" from-port="2" to-layer="7216" to-port="1" /> + <edge from-layer="7216" from-port="2" to-layer="7217" to-port="1" /> + <edge from-layer="7216" from-port="2" to-layer="7277" to-port="0" /> + <edge from-layer="7217" from-port="2" to-layer="7218" to-port="0" /> + <edge from-layer="7217" from-port="2" to-layer="7219" to-port="0" /> + <edge from-layer="7217" from-port="2" to-layer="11178" to-port="0" /> + <edge from-layer="7218" from-port="2" to-layer="7228" to-port="0" /> + <edge from-layer="7219" from-port="1" to-layer="7222" to-port="0" /> + <edge from-layer="7219" from-port="1" to-layer="7226" to-port="0" /> + <edge from-layer="7220" from-port="0" to-layer="7222" to-port="1" /> + <edge from-layer="7221" from-port="0" to-layer="7222" to-port="2" /> + <edge from-layer="7222" from-port="3" to-layer="7227" to-port="0" /> + <edge from-layer="7223" from-port="0" to-layer="7227" to-port="1" /> + <edge from-layer="7224" from-port="0" to-layer="7226" to-port="1" /> + <edge from-layer="7225" from-port="0" to-layer="7226" to-port="2" /> + <edge from-layer="7226" from-port="3" to-layer="7227" to-port="2" /> + <edge from-layer="7227" from-port="3" to-layer="7228" to-port="1" /> + <edge from-layer="7228" from-port="2" to-layer="7230" to-port="0" /> + <edge from-layer="7229" from-port="0" to-layer="7230" to-port="1" /> + <edge from-layer="7230" from-port="2" to-layer="7285" to-port="1" /> + <edge from-layer="7231" from-port="0" to-layer="7236" to-port="0" /> + <edge from-layer="7232" from-port="0" to-layer="7235" to-port="1" /> + <edge from-layer="7233" from-port="0" to-layer="7235" to-port="2" /> + <edge from-layer="7234" from-port="0" to-layer="7235" to-port="3" /> + <edge from-layer="7235" from-port="4" to-layer="7236" to-port="1" /> + <edge from-layer="7236" from-port="2" to-layer="7237" to-port="0" /> + <edge from-layer="7237" from-port="1" to-layer="7239" to-port="0" /> + <edge from-layer="7238" from-port="0" to-layer="7239" to-port="2" /> + <edge from-layer="7239" from-port="3" to-layer="7258" to-port="0" /> + <edge from-layer="7240" from-port="0" to-layer="7241" to-port="0" /> + <edge from-layer="7241" from-port="1" to-layer="7244" to-port="0" /> + <edge from-layer="7242" from-port="0" to-layer="7243" to-port="0" /> + <edge from-layer="7243" from-port="1" to-layer="7244" to-port="1" /> + <edge from-layer="7244" from-port="2" to-layer="7246" to-port="0" /> + <edge from-layer="7245" from-port="0" to-layer="7246" to-port="1" /> + <edge from-layer="7246" from-port="2" to-layer="7248" to-port="0" /> + <edge from-layer="7247" from-port="0" to-layer="7248" to-port="1" /> + <edge from-layer="7248" from-port="2" to-layer="7249" to-port="0" /> + <edge from-layer="7249" from-port="1" to-layer="7250" to-port="1" /> + <edge from-layer="7250" from-port="2" to-layer="7253" to-port="0" /> + <edge from-layer="7251" from-port="0" to-layer="7252" to-port="0" /> + <edge from-layer="7252" from-port="1" to-layer="7253" to-port="1" /> + <edge from-layer="7253" from-port="2" to-layer="7255" to-port="0" /> + <edge from-layer="7254" from-port="0" to-layer="7255" to-port="1" /> + <edge from-layer="7255" from-port="2" to-layer="7257" to-port="0" /> + <edge from-layer="7256" from-port="0" to-layer="7257" to-port="1" /> + <edge from-layer="7257" from-port="2" to-layer="7258" to-port="1" /> + <edge from-layer="7258" from-port="2" to-layer="11177" to-port="0" /> + <edge from-layer="7258" from-port="2" to-layer="7259" to-port="0" /> + <edge from-layer="7258" from-port="2" to-layer="7260" to-port="0" /> + <edge from-layer="7259" from-port="2" to-layer="7269" to-port="0" /> + <edge from-layer="7260" from-port="1" to-layer="7263" to-port="0" /> + <edge from-layer="7260" from-port="1" to-layer="7267" to-port="0" /> + <edge from-layer="7261" from-port="0" to-layer="7263" to-port="1" /> + <edge from-layer="7262" from-port="0" to-layer="7263" to-port="2" /> + <edge from-layer="7263" from-port="3" to-layer="7268" to-port="1" /> + <edge from-layer="7264" from-port="0" to-layer="7268" to-port="2" /> + <edge from-layer="7265" from-port="0" to-layer="7267" to-port="1" /> + <edge from-layer="7266" from-port="0" to-layer="7267" to-port="2" /> + <edge from-layer="7267" from-port="3" to-layer="7268" to-port="3" /> + <edge from-layer="7268" from-port="4" to-layer="7269" to-port="1" /> + <edge from-layer="7269" from-port="2" to-layer="7271" to-port="0" /> + <edge from-layer="7270" from-port="0" to-layer="7271" to-port="1" /> + <edge from-layer="7271" from-port="2" to-layer="7285" to-port="2" /> + <edge from-layer="7272" from-port="0" to-layer="7284" to-port="1" /> + <edge from-layer="7273" from-port="1" to-layer="7276" to-port="0" /> + <edge from-layer="7274" from-port="0" to-layer="7276" to-port="1" /> + <edge from-layer="7275" from-port="0" to-layer="7276" to-port="2" /> + <edge from-layer="7276" from-port="3" to-layer="7281" to-port="0" /> + <edge from-layer="7277" from-port="1" to-layer="7280" to-port="0" /> + <edge from-layer="7278" from-port="0" to-layer="7280" to-port="1" /> + <edge from-layer="7279" from-port="0" to-layer="7280" to-port="2" /> + <edge from-layer="7280" from-port="3" to-layer="7281" to-port="1" /> + <edge from-layer="7281" from-port="2" to-layer="7284" to-port="2" /> + <edge from-layer="7282" from-port="0" to-layer="7284" to-port="3" /> + <edge from-layer="7283" from-port="0" to-layer="7284" to-port="4" /> + <edge from-layer="7284" from-port="5" to-layer="7285" to-port="3" /> + <edge from-layer="7285" from-port="4" to-layer="7287" to-port="0" /> + <edge from-layer="7286" from-port="0" to-layer="7287" to-port="1" /> + <edge from-layer="7287" from-port="2" to-layer="7289" to-port="0" /> + <edge from-layer="7288" from-port="0" to-layer="7289" to-port="1" /> + <edge from-layer="7289" from-port="2" to-layer="7300" to-port="0" /> + <edge from-layer="7290" from-port="0" to-layer="7291" to-port="0" /> + <edge from-layer="7291" from-port="1" to-layer="7294" to-port="0" /> + <edge from-layer="7292" from-port="0" to-layer="7293" to-port="0" /> + <edge from-layer="7293" from-port="1" to-layer="7294" to-port="1" /> + <edge from-layer="7294" from-port="2" to-layer="7296" to-port="0" /> + <edge from-layer="7295" from-port="0" to-layer="7296" to-port="1" /> + <edge from-layer="7296" from-port="2" to-layer="7298" to-port="0" /> + <edge from-layer="7297" from-port="0" to-layer="7298" to-port="1" /> + <edge from-layer="7298" from-port="2" to-layer="7299" to-port="0" /> + <edge from-layer="7299" from-port="1" to-layer="7300" to-port="1" /> + <edge from-layer="7300" from-port="2" to-layer="7301" to-port="1" /> + <edge from-layer="7301" from-port="2" to-layer="7312" to-port="0" /> + <edge from-layer="7301" from-port="2" to-layer="7349" to-port="0" /> + <edge from-layer="7301" from-port="2" to-layer="7305" to-port="0" /> + <edge from-layer="7302" from-port="0" to-layer="7313" to-port="0" /> + <edge from-layer="7303" from-port="0" to-layer="7311" to-port="0" /> + <edge from-layer="7304" from-port="0" to-layer="7305" to-port="1" /> + <edge from-layer="7305" from-port="2" to-layer="7307" to-port="0" /> + <edge from-layer="7306" from-port="0" to-layer="7307" to-port="1" /> + <edge from-layer="7307" from-port="2" to-layer="7309" to-port="0" /> + <edge from-layer="7308" from-port="0" to-layer="7309" to-port="1" /> + <edge from-layer="7309" from-port="2" to-layer="7310" to-port="0" /> + <edge from-layer="7310" from-port="1" to-layer="7311" to-port="1" /> + <edge from-layer="7311" from-port="2" to-layer="7312" to-port="1" /> + <edge from-layer="7312" from-port="2" to-layer="7313" to-port="1" /> + <edge from-layer="7313" from-port="2" to-layer="7324" to-port="0" /> + <edge from-layer="7313" from-port="2" to-layer="7336" to-port="0" /> + <edge from-layer="7314" from-port="0" to-layer="7315" to-port="0" /> + <edge from-layer="7315" from-port="1" to-layer="7318" to-port="0" /> + <edge from-layer="7316" from-port="0" to-layer="7317" to-port="0" /> + <edge from-layer="7317" from-port="1" to-layer="7318" to-port="1" /> + <edge from-layer="7318" from-port="2" to-layer="7320" to-port="0" /> + <edge from-layer="7319" from-port="0" to-layer="7320" to-port="1" /> + <edge from-layer="7320" from-port="2" to-layer="7322" to-port="0" /> + <edge from-layer="7321" from-port="0" to-layer="7322" to-port="1" /> + <edge from-layer="7322" from-port="2" to-layer="7323" to-port="0" /> + <edge from-layer="7323" from-port="1" to-layer="7324" to-port="1" /> + <edge from-layer="7324" from-port="2" to-layer="7325" to-port="0" /> + <edge from-layer="7325" from-port="1" to-layer="7337" to-port="0" /> + <edge from-layer="7326" from-port="0" to-layer="7327" to-port="0" /> + <edge from-layer="7327" from-port="1" to-layer="7330" to-port="0" /> + <edge from-layer="7328" from-port="0" to-layer="7329" to-port="0" /> + <edge from-layer="7329" from-port="1" to-layer="7330" to-port="1" /> + <edge from-layer="7330" from-port="2" to-layer="7332" to-port="0" /> + <edge from-layer="7331" from-port="0" to-layer="7332" to-port="1" /> + <edge from-layer="7332" from-port="2" to-layer="7334" to-port="0" /> + <edge from-layer="7333" from-port="0" to-layer="7334" to-port="1" /> + <edge from-layer="7334" from-port="2" to-layer="7335" to-port="0" /> + <edge from-layer="7335" from-port="1" to-layer="7336" to-port="1" /> + <edge from-layer="7336" from-port="2" to-layer="7337" to-port="1" /> + <edge from-layer="7337" from-port="2" to-layer="7348" to-port="0" /> + <edge from-layer="7338" from-port="0" to-layer="7339" to-port="0" /> + <edge from-layer="7339" from-port="1" to-layer="7342" to-port="0" /> + <edge from-layer="7340" from-port="0" to-layer="7341" to-port="0" /> + <edge from-layer="7341" from-port="1" to-layer="7342" to-port="1" /> + <edge from-layer="7342" from-port="2" to-layer="7344" to-port="0" /> + <edge from-layer="7343" from-port="0" to-layer="7344" to-port="1" /> + <edge from-layer="7344" from-port="2" to-layer="7346" to-port="0" /> + <edge from-layer="7345" from-port="0" to-layer="7346" to-port="1" /> + <edge from-layer="7346" from-port="2" to-layer="7347" to-port="0" /> + <edge from-layer="7347" from-port="1" to-layer="7348" to-port="1" /> + <edge from-layer="7348" from-port="2" to-layer="7349" to-port="1" /> + <edge from-layer="7349" from-port="2" to-layer="7353" to-port="0" /> + <edge from-layer="7349" from-port="2" to-layer="7360" to-port="0" /> + <edge from-layer="7349" from-port="2" to-layer="7533" to-port="0" /> + <edge from-layer="7350" from-port="0" to-layer="7361" to-port="0" /> + <edge from-layer="7351" from-port="0" to-layer="7359" to-port="0" /> + <edge from-layer="7352" from-port="0" to-layer="7353" to-port="1" /> + <edge from-layer="7353" from-port="2" to-layer="7355" to-port="0" /> + <edge from-layer="7354" from-port="0" to-layer="7355" to-port="1" /> + <edge from-layer="7355" from-port="2" to-layer="7357" to-port="0" /> + <edge from-layer="7356" from-port="0" to-layer="7357" to-port="1" /> + <edge from-layer="7357" from-port="2" to-layer="7358" to-port="0" /> + <edge from-layer="7358" from-port="1" to-layer="7359" to-port="1" /> + <edge from-layer="7359" from-port="2" to-layer="7360" to-port="1" /> + <edge from-layer="7360" from-port="2" to-layer="7361" to-port="1" /> + <edge from-layer="7361" from-port="2" to-layer="7372" to-port="0" /> + <edge from-layer="7361" from-port="2" to-layer="7420" to-port="0" /> + <edge from-layer="7361" from-port="2" to-layer="7482" to-port="0" /> + <edge from-layer="7362" from-port="0" to-layer="7363" to-port="0" /> + <edge from-layer="7363" from-port="1" to-layer="7366" to-port="0" /> + <edge from-layer="7364" from-port="0" to-layer="7365" to-port="0" /> + <edge from-layer="7365" from-port="1" to-layer="7366" to-port="1" /> + <edge from-layer="7366" from-port="2" to-layer="7368" to-port="0" /> + <edge from-layer="7367" from-port="0" to-layer="7368" to-port="1" /> + <edge from-layer="7368" from-port="2" to-layer="7370" to-port="0" /> + <edge from-layer="7369" from-port="0" to-layer="7370" to-port="1" /> + <edge from-layer="7370" from-port="2" to-layer="7371" to-port="0" /> + <edge from-layer="7371" from-port="1" to-layer="7372" to-port="1" /> + <edge from-layer="7372" from-port="2" to-layer="7375" to-port="0" /> + <edge from-layer="7373" from-port="0" to-layer="7374" to-port="0" /> + <edge from-layer="7374" from-port="1" to-layer="7375" to-port="1" /> + <edge from-layer="7375" from-port="2" to-layer="7377" to-port="0" /> + <edge from-layer="7376" from-port="0" to-layer="7377" to-port="1" /> + <edge from-layer="7377" from-port="2" to-layer="7379" to-port="0" /> + <edge from-layer="7378" from-port="0" to-layer="7379" to-port="1" /> + <edge from-layer="7379" from-port="2" to-layer="7391" to-port="0" /> + <edge from-layer="7379" from-port="2" to-layer="7397" to-port="0" /> + <edge from-layer="7379" from-port="2" to-layer="7381" to-port="0" /> + <edge from-layer="7379" from-port="2" to-layer="7380" to-port="0" /> + <edge from-layer="7380" from-port="2" to-layer="7400" to-port="0" /> + <edge from-layer="7381" from-port="1" to-layer="7383" to-port="0" /> + <edge from-layer="7382" from-port="0" to-layer="7383" to-port="2" /> + <edge from-layer="7383" from-port="3" to-layer="7384" to-port="0" /> + <edge from-layer="7384" from-port="2" to-layer="7385" to-port="0" /> + <edge from-layer="7385" from-port="1" to-layer="7387" to-port="0" /> + <edge from-layer="7386" from-port="0" to-layer="7387" to-port="1" /> + <edge from-layer="7387" from-port="2" to-layer="7397" to-port="2" /> + <edge from-layer="7387" from-port="2" to-layer="7391" to-port="1" /> + <edge from-layer="7388" from-port="0" to-layer="7391" to-port="2" /> + <edge from-layer="7389" from-port="0" to-layer="7391" to-port="3" /> + <edge from-layer="7390" from-port="0" to-layer="7391" to-port="4" /> + <edge from-layer="7391" from-port="5" to-layer="7393" to-port="0" /> + <edge from-layer="7392" from-port="0" to-layer="7393" to-port="1" /> + <edge from-layer="7393" from-port="2" to-layer="7398" to-port="0" /> + <edge from-layer="7394" from-port="0" to-layer="7397" to-port="1" /> + <edge from-layer="7395" from-port="0" to-layer="7397" to-port="3" /> + <edge from-layer="7396" from-port="0" to-layer="7397" to-port="4" /> + <edge from-layer="7397" from-port="5" to-layer="7398" to-port="1" /> + <edge from-layer="7398" from-port="2" to-layer="7399" to-port="0" /> + <edge from-layer="7399" from-port="2" to-layer="7400" to-port="1" /> + <edge from-layer="7400" from-port="2" to-layer="7517" to-port="0" /> + <edge from-layer="7401" from-port="0" to-layer="7406" to-port="0" /> + <edge from-layer="7402" from-port="0" to-layer="7405" to-port="1" /> + <edge from-layer="7403" from-port="0" to-layer="7405" to-port="2" /> + <edge from-layer="7404" from-port="0" to-layer="7405" to-port="3" /> + <edge from-layer="7405" from-port="4" to-layer="7406" to-port="1" /> + <edge from-layer="7406" from-port="2" to-layer="7407" to-port="0" /> + <edge from-layer="7407" from-port="1" to-layer="7409" to-port="0" /> + <edge from-layer="7408" from-port="0" to-layer="7409" to-port="2" /> + <edge from-layer="7409" from-port="3" to-layer="7505" to-port="0" /> + <edge from-layer="7409" from-port="3" to-layer="7449" to-port="0" /> + <edge from-layer="7410" from-port="0" to-layer="7411" to-port="0" /> + <edge from-layer="7411" from-port="1" to-layer="7414" to-port="0" /> + <edge from-layer="7412" from-port="0" to-layer="7413" to-port="0" /> + <edge from-layer="7413" from-port="1" to-layer="7414" to-port="1" /> + <edge from-layer="7414" from-port="2" to-layer="7416" to-port="0" /> + <edge from-layer="7415" from-port="0" to-layer="7416" to-port="1" /> + <edge from-layer="7416" from-port="2" to-layer="7418" to-port="0" /> + <edge from-layer="7417" from-port="0" to-layer="7418" to-port="1" /> + <edge from-layer="7418" from-port="2" to-layer="7419" to-port="0" /> + <edge from-layer="7419" from-port="1" to-layer="7420" to-port="1" /> + <edge from-layer="7420" from-port="2" to-layer="7423" to-port="0" /> + <edge from-layer="7421" from-port="0" to-layer="7422" to-port="0" /> + <edge from-layer="7422" from-port="1" to-layer="7423" to-port="1" /> + <edge from-layer="7423" from-port="2" to-layer="7425" to-port="0" /> + <edge from-layer="7424" from-port="0" to-layer="7425" to-port="1" /> + <edge from-layer="7425" from-port="2" to-layer="7427" to-port="0" /> + <edge from-layer="7426" from-port="0" to-layer="7427" to-port="1" /> + <edge from-layer="7427" from-port="2" to-layer="7445" to-port="0" /> + <edge from-layer="7427" from-port="2" to-layer="7439" to-port="0" /> + <edge from-layer="7427" from-port="2" to-layer="7428" to-port="0" /> + <edge from-layer="7427" from-port="2" to-layer="7429" to-port="0" /> + <edge from-layer="7428" from-port="2" to-layer="7448" to-port="0" /> + <edge from-layer="7429" from-port="1" to-layer="7431" to-port="0" /> + <edge from-layer="7430" from-port="0" to-layer="7431" to-port="2" /> + <edge from-layer="7431" from-port="3" to-layer="7432" to-port="0" /> + <edge from-layer="7432" from-port="2" to-layer="7433" to-port="0" /> + <edge from-layer="7433" from-port="1" to-layer="7435" to-port="0" /> + <edge from-layer="7434" from-port="0" to-layer="7435" to-port="1" /> + <edge from-layer="7435" from-port="2" to-layer="7439" to-port="1" /> + <edge from-layer="7435" from-port="2" to-layer="7445" to-port="2" /> + <edge from-layer="7436" from-port="0" to-layer="7439" to-port="2" /> + <edge from-layer="7437" from-port="0" to-layer="7439" to-port="3" /> + <edge from-layer="7438" from-port="0" to-layer="7439" to-port="4" /> + <edge from-layer="7439" from-port="5" to-layer="7441" to-port="0" /> + <edge from-layer="7440" from-port="0" to-layer="7441" to-port="1" /> + <edge from-layer="7441" from-port="2" to-layer="7446" to-port="0" /> + <edge from-layer="7442" from-port="0" to-layer="7445" to-port="1" /> + <edge from-layer="7443" from-port="0" to-layer="7445" to-port="3" /> + <edge from-layer="7444" from-port="0" to-layer="7445" to-port="4" /> + <edge from-layer="7445" from-port="5" to-layer="7446" to-port="1" /> + <edge from-layer="7446" from-port="2" to-layer="7447" to-port="0" /> + <edge from-layer="7447" from-port="2" to-layer="7448" to-port="1" /> + <edge from-layer="7448" from-port="2" to-layer="7449" to-port="1" /> + <edge from-layer="7448" from-port="2" to-layer="7509" to-port="0" /> + <edge from-layer="7449" from-port="2" to-layer="11176" to-port="0" /> + <edge from-layer="7449" from-port="2" to-layer="7450" to-port="0" /> + <edge from-layer="7449" from-port="2" to-layer="7451" to-port="0" /> + <edge from-layer="7450" from-port="2" to-layer="7460" to-port="0" /> + <edge from-layer="7451" from-port="1" to-layer="7454" to-port="0" /> + <edge from-layer="7451" from-port="1" to-layer="7458" to-port="0" /> + <edge from-layer="7452" from-port="0" to-layer="7454" to-port="1" /> + <edge from-layer="7453" from-port="0" to-layer="7454" to-port="2" /> + <edge from-layer="7454" from-port="3" to-layer="7459" to-port="0" /> + <edge from-layer="7455" from-port="0" to-layer="7459" to-port="1" /> + <edge from-layer="7456" from-port="0" to-layer="7458" to-port="1" /> + <edge from-layer="7457" from-port="0" to-layer="7458" to-port="2" /> + <edge from-layer="7458" from-port="3" to-layer="7459" to-port="2" /> + <edge from-layer="7459" from-port="3" to-layer="7460" to-port="1" /> + <edge from-layer="7460" from-port="2" to-layer="7462" to-port="0" /> + <edge from-layer="7461" from-port="0" to-layer="7462" to-port="1" /> + <edge from-layer="7462" from-port="2" to-layer="7517" to-port="1" /> + <edge from-layer="7463" from-port="0" to-layer="7468" to-port="0" /> + <edge from-layer="7464" from-port="0" to-layer="7467" to-port="1" /> + <edge from-layer="7465" from-port="0" to-layer="7467" to-port="2" /> + <edge from-layer="7466" from-port="0" to-layer="7467" to-port="3" /> + <edge from-layer="7467" from-port="4" to-layer="7468" to-port="1" /> + <edge from-layer="7468" from-port="2" to-layer="7469" to-port="0" /> + <edge from-layer="7469" from-port="1" to-layer="7471" to-port="0" /> + <edge from-layer="7470" from-port="0" to-layer="7471" to-port="2" /> + <edge from-layer="7471" from-port="3" to-layer="7490" to-port="0" /> + <edge from-layer="7472" from-port="0" to-layer="7473" to-port="0" /> + <edge from-layer="7473" from-port="1" to-layer="7476" to-port="0" /> + <edge from-layer="7474" from-port="0" to-layer="7475" to-port="0" /> + <edge from-layer="7475" from-port="1" to-layer="7476" to-port="1" /> + <edge from-layer="7476" from-port="2" to-layer="7478" to-port="0" /> + <edge from-layer="7477" from-port="0" to-layer="7478" to-port="1" /> + <edge from-layer="7478" from-port="2" to-layer="7480" to-port="0" /> + <edge from-layer="7479" from-port="0" to-layer="7480" to-port="1" /> + <edge from-layer="7480" from-port="2" to-layer="7481" to-port="0" /> + <edge from-layer="7481" from-port="1" to-layer="7482" to-port="1" /> + <edge from-layer="7482" from-port="2" to-layer="7485" to-port="0" /> + <edge from-layer="7483" from-port="0" to-layer="7484" to-port="0" /> + <edge from-layer="7484" from-port="1" to-layer="7485" to-port="1" /> + <edge from-layer="7485" from-port="2" to-layer="7487" to-port="0" /> + <edge from-layer="7486" from-port="0" to-layer="7487" to-port="1" /> + <edge from-layer="7487" from-port="2" to-layer="7489" to-port="0" /> + <edge from-layer="7488" from-port="0" to-layer="7489" to-port="1" /> + <edge from-layer="7489" from-port="2" to-layer="7490" to-port="1" /> + <edge from-layer="7490" from-port="2" to-layer="7491" to-port="0" /> + <edge from-layer="7490" from-port="2" to-layer="7492" to-port="0" /> + <edge from-layer="7490" from-port="2" to-layer="11175" to-port="0" /> + <edge from-layer="7491" from-port="2" to-layer="7501" to-port="0" /> + <edge from-layer="7492" from-port="1" to-layer="7495" to-port="0" /> + <edge from-layer="7492" from-port="1" to-layer="7499" to-port="0" /> + <edge from-layer="7493" from-port="0" to-layer="7495" to-port="1" /> + <edge from-layer="7494" from-port="0" to-layer="7495" to-port="2" /> + <edge from-layer="7495" from-port="3" to-layer="7500" to-port="1" /> + <edge from-layer="7496" from-port="0" to-layer="7500" to-port="2" /> + <edge from-layer="7497" from-port="0" to-layer="7499" to-port="1" /> + <edge from-layer="7498" from-port="0" to-layer="7499" to-port="2" /> + <edge from-layer="7499" from-port="3" to-layer="7500" to-port="3" /> + <edge from-layer="7500" from-port="4" to-layer="7501" to-port="1" /> + <edge from-layer="7501" from-port="2" to-layer="7503" to-port="0" /> + <edge from-layer="7502" from-port="0" to-layer="7503" to-port="1" /> + <edge from-layer="7503" from-port="2" to-layer="7517" to-port="2" /> + <edge from-layer="7504" from-port="0" to-layer="7516" to-port="1" /> + <edge from-layer="7505" from-port="1" to-layer="7508" to-port="0" /> + <edge from-layer="7506" from-port="0" to-layer="7508" to-port="1" /> + <edge from-layer="7507" from-port="0" to-layer="7508" to-port="2" /> + <edge from-layer="7508" from-port="3" to-layer="7513" to-port="0" /> + <edge from-layer="7509" from-port="1" to-layer="7512" to-port="0" /> + <edge from-layer="7510" from-port="0" to-layer="7512" to-port="1" /> + <edge from-layer="7511" from-port="0" to-layer="7512" to-port="2" /> + <edge from-layer="7512" from-port="3" to-layer="7513" to-port="1" /> + <edge from-layer="7513" from-port="2" to-layer="7516" to-port="2" /> + <edge from-layer="7514" from-port="0" to-layer="7516" to-port="3" /> + <edge from-layer="7515" from-port="0" to-layer="7516" to-port="4" /> + <edge from-layer="7516" from-port="5" to-layer="7517" to-port="3" /> + <edge from-layer="7517" from-port="4" to-layer="7519" to-port="0" /> + <edge from-layer="7518" from-port="0" to-layer="7519" to-port="1" /> + <edge from-layer="7519" from-port="2" to-layer="7521" to-port="0" /> + <edge from-layer="7520" from-port="0" to-layer="7521" to-port="1" /> + <edge from-layer="7521" from-port="2" to-layer="7532" to-port="0" /> + <edge from-layer="7522" from-port="0" to-layer="7523" to-port="0" /> + <edge from-layer="7523" from-port="1" to-layer="7526" to-port="0" /> + <edge from-layer="7524" from-port="0" to-layer="7525" to-port="0" /> + <edge from-layer="7525" from-port="1" to-layer="7526" to-port="1" /> + <edge from-layer="7526" from-port="2" to-layer="7528" to-port="0" /> + <edge from-layer="7527" from-port="0" to-layer="7528" to-port="1" /> + <edge from-layer="7528" from-port="2" to-layer="7530" to-port="0" /> + <edge from-layer="7529" from-port="0" to-layer="7530" to-port="1" /> + <edge from-layer="7530" from-port="2" to-layer="7531" to-port="0" /> + <edge from-layer="7531" from-port="1" to-layer="7532" to-port="1" /> + <edge from-layer="7532" from-port="2" to-layer="7533" to-port="1" /> + <edge from-layer="7533" from-port="2" to-layer="7537" to-port="0" /> + <edge from-layer="7533" from-port="2" to-layer="7544" to-port="0" /> + <edge from-layer="7533" from-port="2" to-layer="7581" to-port="0" /> + <edge from-layer="7534" from-port="0" to-layer="7545" to-port="0" /> + <edge from-layer="7535" from-port="0" to-layer="7543" to-port="0" /> + <edge from-layer="7536" from-port="0" to-layer="7537" to-port="1" /> + <edge from-layer="7537" from-port="2" to-layer="7539" to-port="0" /> + <edge from-layer="7538" from-port="0" to-layer="7539" to-port="1" /> + <edge from-layer="7539" from-port="2" to-layer="7541" to-port="0" /> + <edge from-layer="7540" from-port="0" to-layer="7541" to-port="1" /> + <edge from-layer="7541" from-port="2" to-layer="7542" to-port="0" /> + <edge from-layer="7542" from-port="1" to-layer="7543" to-port="1" /> + <edge from-layer="7543" from-port="2" to-layer="7544" to-port="1" /> + <edge from-layer="7544" from-port="2" to-layer="7545" to-port="1" /> + <edge from-layer="7545" from-port="2" to-layer="7556" to-port="0" /> + <edge from-layer="7545" from-port="2" to-layer="7568" to-port="0" /> + <edge from-layer="7546" from-port="0" to-layer="7547" to-port="0" /> + <edge from-layer="7547" from-port="1" to-layer="7550" to-port="0" /> + <edge from-layer="7548" from-port="0" to-layer="7549" to-port="0" /> + <edge from-layer="7549" from-port="1" to-layer="7550" to-port="1" /> + <edge from-layer="7550" from-port="2" to-layer="7552" to-port="0" /> + <edge from-layer="7551" from-port="0" to-layer="7552" to-port="1" /> + <edge from-layer="7552" from-port="2" to-layer="7554" to-port="0" /> + <edge from-layer="7553" from-port="0" to-layer="7554" to-port="1" /> + <edge from-layer="7554" from-port="2" to-layer="7555" to-port="0" /> + <edge from-layer="7555" from-port="1" to-layer="7556" to-port="1" /> + <edge from-layer="7556" from-port="2" to-layer="7557" to-port="0" /> + <edge from-layer="7557" from-port="1" to-layer="7569" to-port="0" /> + <edge from-layer="7558" from-port="0" to-layer="7559" to-port="0" /> + <edge from-layer="7559" from-port="1" to-layer="7562" to-port="0" /> + <edge from-layer="7560" from-port="0" to-layer="7561" to-port="0" /> + <edge from-layer="7561" from-port="1" to-layer="7562" to-port="1" /> + <edge from-layer="7562" from-port="2" to-layer="7564" to-port="0" /> + <edge from-layer="7563" from-port="0" to-layer="7564" to-port="1" /> + <edge from-layer="7564" from-port="2" to-layer="7566" to-port="0" /> + <edge from-layer="7565" from-port="0" to-layer="7566" to-port="1" /> + <edge from-layer="7566" from-port="2" to-layer="7567" to-port="0" /> + <edge from-layer="7567" from-port="1" to-layer="7568" to-port="1" /> + <edge from-layer="7568" from-port="2" to-layer="7569" to-port="1" /> + <edge from-layer="7569" from-port="2" to-layer="7580" to-port="0" /> + <edge from-layer="7570" from-port="0" to-layer="7571" to-port="0" /> + <edge from-layer="7571" from-port="1" to-layer="7574" to-port="0" /> + <edge from-layer="7572" from-port="0" to-layer="7573" to-port="0" /> + <edge from-layer="7573" from-port="1" to-layer="7574" to-port="1" /> + <edge from-layer="7574" from-port="2" to-layer="7576" to-port="0" /> + <edge from-layer="7575" from-port="0" to-layer="7576" to-port="1" /> + <edge from-layer="7576" from-port="2" to-layer="7578" to-port="0" /> + <edge from-layer="7577" from-port="0" to-layer="7578" to-port="1" /> + <edge from-layer="7578" from-port="2" to-layer="7579" to-port="0" /> + <edge from-layer="7579" from-port="1" to-layer="7580" to-port="1" /> + <edge from-layer="7580" from-port="2" to-layer="7581" to-port="1" /> + <edge from-layer="7581" from-port="2" to-layer="7585" to-port="0" /> + <edge from-layer="7581" from-port="2" to-layer="7592" to-port="0" /> + <edge from-layer="7581" from-port="2" to-layer="7765" to-port="0" /> + <edge from-layer="7582" from-port="0" to-layer="7593" to-port="0" /> + <edge from-layer="7583" from-port="0" to-layer="7591" to-port="0" /> + <edge from-layer="7584" from-port="0" to-layer="7585" to-port="1" /> + <edge from-layer="7585" from-port="2" to-layer="7587" to-port="0" /> + <edge from-layer="7586" from-port="0" to-layer="7587" to-port="1" /> + <edge from-layer="7587" from-port="2" to-layer="7589" to-port="0" /> + <edge from-layer="7588" from-port="0" to-layer="7589" to-port="1" /> + <edge from-layer="7589" from-port="2" to-layer="7590" to-port="0" /> + <edge from-layer="7590" from-port="1" to-layer="7591" to-port="1" /> + <edge from-layer="7591" from-port="2" to-layer="7592" to-port="1" /> + <edge from-layer="7592" from-port="2" to-layer="7593" to-port="1" /> + <edge from-layer="7593" from-port="2" to-layer="7652" to-port="0" /> + <edge from-layer="7593" from-port="2" to-layer="7714" to-port="0" /> + <edge from-layer="7593" from-port="2" to-layer="7604" to-port="0" /> + <edge from-layer="7594" from-port="0" to-layer="7595" to-port="0" /> + <edge from-layer="7595" from-port="1" to-layer="7598" to-port="0" /> + <edge from-layer="7596" from-port="0" to-layer="7597" to-port="0" /> + <edge from-layer="7597" from-port="1" to-layer="7598" to-port="1" /> + <edge from-layer="7598" from-port="2" to-layer="7600" to-port="0" /> + <edge from-layer="7599" from-port="0" to-layer="7600" to-port="1" /> + <edge from-layer="7600" from-port="2" to-layer="7602" to-port="0" /> + <edge from-layer="7601" from-port="0" to-layer="7602" to-port="1" /> + <edge from-layer="7602" from-port="2" to-layer="7603" to-port="0" /> + <edge from-layer="7603" from-port="1" to-layer="7604" to-port="1" /> + <edge from-layer="7604" from-port="2" to-layer="7607" to-port="0" /> + <edge from-layer="7605" from-port="0" to-layer="7606" to-port="0" /> + <edge from-layer="7606" from-port="1" to-layer="7607" to-port="1" /> + <edge from-layer="7607" from-port="2" to-layer="7609" to-port="0" /> + <edge from-layer="7608" from-port="0" to-layer="7609" to-port="1" /> + <edge from-layer="7609" from-port="2" to-layer="7611" to-port="0" /> + <edge from-layer="7610" from-port="0" to-layer="7611" to-port="1" /> + <edge from-layer="7611" from-port="2" to-layer="7629" to-port="0" /> + <edge from-layer="7611" from-port="2" to-layer="7623" to-port="0" /> + <edge from-layer="7611" from-port="2" to-layer="7612" to-port="0" /> + <edge from-layer="7611" from-port="2" to-layer="7613" to-port="0" /> + <edge from-layer="7612" from-port="2" to-layer="7632" to-port="0" /> + <edge from-layer="7613" from-port="1" to-layer="7615" to-port="0" /> + <edge from-layer="7614" from-port="0" to-layer="7615" to-port="2" /> + <edge from-layer="7615" from-port="3" to-layer="7616" to-port="0" /> + <edge from-layer="7616" from-port="2" to-layer="7617" to-port="0" /> + <edge from-layer="7617" from-port="1" to-layer="7619" to-port="0" /> + <edge from-layer="7618" from-port="0" to-layer="7619" to-port="1" /> + <edge from-layer="7619" from-port="2" to-layer="7623" to-port="1" /> + <edge from-layer="7619" from-port="2" to-layer="7629" to-port="2" /> + <edge from-layer="7620" from-port="0" to-layer="7623" to-port="2" /> + <edge from-layer="7621" from-port="0" to-layer="7623" to-port="3" /> + <edge from-layer="7622" from-port="0" to-layer="7623" to-port="4" /> + <edge from-layer="7623" from-port="5" to-layer="7625" to-port="0" /> + <edge from-layer="7624" from-port="0" to-layer="7625" to-port="1" /> + <edge from-layer="7625" from-port="2" to-layer="7630" to-port="0" /> + <edge from-layer="7626" from-port="0" to-layer="7629" to-port="1" /> + <edge from-layer="7627" from-port="0" to-layer="7629" to-port="3" /> + <edge from-layer="7628" from-port="0" to-layer="7629" to-port="4" /> + <edge from-layer="7629" from-port="5" to-layer="7630" to-port="1" /> + <edge from-layer="7630" from-port="2" to-layer="7631" to-port="0" /> + <edge from-layer="7631" from-port="2" to-layer="7632" to-port="1" /> + <edge from-layer="7632" from-port="2" to-layer="7749" to-port="0" /> + <edge from-layer="7633" from-port="0" to-layer="7638" to-port="0" /> + <edge from-layer="7634" from-port="0" to-layer="7637" to-port="1" /> + <edge from-layer="7635" from-port="0" to-layer="7637" to-port="2" /> + <edge from-layer="7636" from-port="0" to-layer="7637" to-port="3" /> + <edge from-layer="7637" from-port="4" to-layer="7638" to-port="1" /> + <edge from-layer="7638" from-port="2" to-layer="7639" to-port="0" /> + <edge from-layer="7639" from-port="1" to-layer="7641" to-port="0" /> + <edge from-layer="7640" from-port="0" to-layer="7641" to-port="2" /> + <edge from-layer="7641" from-port="3" to-layer="7681" to-port="0" /> + <edge from-layer="7641" from-port="3" to-layer="7737" to-port="0" /> + <edge from-layer="7642" from-port="0" to-layer="7643" to-port="0" /> + <edge from-layer="7643" from-port="1" to-layer="7646" to-port="0" /> + <edge from-layer="7644" from-port="0" to-layer="7645" to-port="0" /> + <edge from-layer="7645" from-port="1" to-layer="7646" to-port="1" /> + <edge from-layer="7646" from-port="2" to-layer="7648" to-port="0" /> + <edge from-layer="7647" from-port="0" to-layer="7648" to-port="1" /> + <edge from-layer="7648" from-port="2" to-layer="7650" to-port="0" /> + <edge from-layer="7649" from-port="0" to-layer="7650" to-port="1" /> + <edge from-layer="7650" from-port="2" to-layer="7651" to-port="0" /> + <edge from-layer="7651" from-port="1" to-layer="7652" to-port="1" /> + <edge from-layer="7652" from-port="2" to-layer="7655" to-port="0" /> + <edge from-layer="7653" from-port="0" to-layer="7654" to-port="0" /> + <edge from-layer="7654" from-port="1" to-layer="7655" to-port="1" /> + <edge from-layer="7655" from-port="2" to-layer="7657" to-port="0" /> + <edge from-layer="7656" from-port="0" to-layer="7657" to-port="1" /> + <edge from-layer="7657" from-port="2" to-layer="7659" to-port="0" /> + <edge from-layer="7658" from-port="0" to-layer="7659" to-port="1" /> + <edge from-layer="7659" from-port="2" to-layer="7660" to-port="0" /> + <edge from-layer="7659" from-port="2" to-layer="7661" to-port="0" /> + <edge from-layer="7659" from-port="2" to-layer="7671" to-port="0" /> + <edge from-layer="7659" from-port="2" to-layer="7677" to-port="0" /> + <edge from-layer="7660" from-port="2" to-layer="7680" to-port="0" /> + <edge from-layer="7661" from-port="1" to-layer="7663" to-port="0" /> + <edge from-layer="7662" from-port="0" to-layer="7663" to-port="2" /> + <edge from-layer="7663" from-port="3" to-layer="7664" to-port="0" /> + <edge from-layer="7664" from-port="2" to-layer="7665" to-port="0" /> + <edge from-layer="7665" from-port="1" to-layer="7667" to-port="0" /> + <edge from-layer="7666" from-port="0" to-layer="7667" to-port="1" /> + <edge from-layer="7667" from-port="2" to-layer="7671" to-port="1" /> + <edge from-layer="7667" from-port="2" to-layer="7677" to-port="2" /> + <edge from-layer="7668" from-port="0" to-layer="7671" to-port="2" /> + <edge from-layer="7669" from-port="0" to-layer="7671" to-port="3" /> + <edge from-layer="7670" from-port="0" to-layer="7671" to-port="4" /> + <edge from-layer="7671" from-port="5" to-layer="7673" to-port="0" /> + <edge from-layer="7672" from-port="0" to-layer="7673" to-port="1" /> + <edge from-layer="7673" from-port="2" to-layer="7678" to-port="0" /> + <edge from-layer="7674" from-port="0" to-layer="7677" to-port="1" /> + <edge from-layer="7675" from-port="0" to-layer="7677" to-port="3" /> + <edge from-layer="7676" from-port="0" to-layer="7677" to-port="4" /> + <edge from-layer="7677" from-port="5" to-layer="7678" to-port="1" /> + <edge from-layer="7678" from-port="2" to-layer="7679" to-port="0" /> + <edge from-layer="7679" from-port="2" to-layer="7680" to-port="1" /> + <edge from-layer="7680" from-port="2" to-layer="7681" to-port="1" /> + <edge from-layer="7680" from-port="2" to-layer="7741" to-port="0" /> + <edge from-layer="7681" from-port="2" to-layer="7682" to-port="0" /> + <edge from-layer="7681" from-port="2" to-layer="7683" to-port="0" /> + <edge from-layer="7681" from-port="2" to-layer="11174" to-port="0" /> + <edge from-layer="7682" from-port="2" to-layer="7692" to-port="0" /> + <edge from-layer="7683" from-port="1" to-layer="7690" to-port="0" /> + <edge from-layer="7683" from-port="1" to-layer="7686" to-port="0" /> + <edge from-layer="7684" from-port="0" to-layer="7686" to-port="1" /> + <edge from-layer="7685" from-port="0" to-layer="7686" to-port="2" /> + <edge from-layer="7686" from-port="3" to-layer="7691" to-port="0" /> + <edge from-layer="7687" from-port="0" to-layer="7691" to-port="1" /> + <edge from-layer="7688" from-port="0" to-layer="7690" to-port="1" /> + <edge from-layer="7689" from-port="0" to-layer="7690" to-port="2" /> + <edge from-layer="7690" from-port="3" to-layer="7691" to-port="2" /> + <edge from-layer="7691" from-port="3" to-layer="7692" to-port="1" /> + <edge from-layer="7692" from-port="2" to-layer="7694" to-port="0" /> + <edge from-layer="7693" from-port="0" to-layer="7694" to-port="1" /> + <edge from-layer="7694" from-port="2" to-layer="7749" to-port="1" /> + <edge from-layer="7695" from-port="0" to-layer="7700" to-port="0" /> + <edge from-layer="7696" from-port="0" to-layer="7699" to-port="1" /> + <edge from-layer="7697" from-port="0" to-layer="7699" to-port="2" /> + <edge from-layer="7698" from-port="0" to-layer="7699" to-port="3" /> + <edge from-layer="7699" from-port="4" to-layer="7700" to-port="1" /> + <edge from-layer="7700" from-port="2" to-layer="7701" to-port="0" /> + <edge from-layer="7701" from-port="1" to-layer="7703" to-port="0" /> + <edge from-layer="7702" from-port="0" to-layer="7703" to-port="2" /> + <edge from-layer="7703" from-port="3" to-layer="7722" to-port="0" /> + <edge from-layer="7704" from-port="0" to-layer="7705" to-port="0" /> + <edge from-layer="7705" from-port="1" to-layer="7708" to-port="0" /> + <edge from-layer="7706" from-port="0" to-layer="7707" to-port="0" /> + <edge from-layer="7707" from-port="1" to-layer="7708" to-port="1" /> + <edge from-layer="7708" from-port="2" to-layer="7710" to-port="0" /> + <edge from-layer="7709" from-port="0" to-layer="7710" to-port="1" /> + <edge from-layer="7710" from-port="2" to-layer="7712" to-port="0" /> + <edge from-layer="7711" from-port="0" to-layer="7712" to-port="1" /> + <edge from-layer="7712" from-port="2" to-layer="7713" to-port="0" /> + <edge from-layer="7713" from-port="1" to-layer="7714" to-port="1" /> + <edge from-layer="7714" from-port="2" to-layer="7717" to-port="0" /> + <edge from-layer="7715" from-port="0" to-layer="7716" to-port="0" /> + <edge from-layer="7716" from-port="1" to-layer="7717" to-port="1" /> + <edge from-layer="7717" from-port="2" to-layer="7719" to-port="0" /> + <edge from-layer="7718" from-port="0" to-layer="7719" to-port="1" /> + <edge from-layer="7719" from-port="2" to-layer="7721" to-port="0" /> + <edge from-layer="7720" from-port="0" to-layer="7721" to-port="1" /> + <edge from-layer="7721" from-port="2" to-layer="7722" to-port="1" /> + <edge from-layer="7722" from-port="2" to-layer="11173" to-port="0" /> + <edge from-layer="7722" from-port="2" to-layer="7724" to-port="0" /> + <edge from-layer="7722" from-port="2" to-layer="7723" to-port="0" /> + <edge from-layer="7723" from-port="2" to-layer="7733" to-port="0" /> + <edge from-layer="7724" from-port="1" to-layer="7731" to-port="0" /> + <edge from-layer="7724" from-port="1" to-layer="7727" to-port="0" /> + <edge from-layer="7725" from-port="0" to-layer="7727" to-port="1" /> + <edge from-layer="7726" from-port="0" to-layer="7727" to-port="2" /> + <edge from-layer="7727" from-port="3" to-layer="7732" to-port="1" /> + <edge from-layer="7728" from-port="0" to-layer="7732" to-port="2" /> + <edge from-layer="7729" from-port="0" to-layer="7731" to-port="1" /> + <edge from-layer="7730" from-port="0" to-layer="7731" to-port="2" /> + <edge from-layer="7731" from-port="3" to-layer="7732" to-port="3" /> + <edge from-layer="7732" from-port="4" to-layer="7733" to-port="1" /> + <edge from-layer="7733" from-port="2" to-layer="7735" to-port="0" /> + <edge from-layer="7734" from-port="0" to-layer="7735" to-port="1" /> + <edge from-layer="7735" from-port="2" to-layer="7749" to-port="2" /> + <edge from-layer="7736" from-port="0" to-layer="7748" to-port="1" /> + <edge from-layer="7737" from-port="1" to-layer="7740" to-port="0" /> + <edge from-layer="7738" from-port="0" to-layer="7740" to-port="1" /> + <edge from-layer="7739" from-port="0" to-layer="7740" to-port="2" /> + <edge from-layer="7740" from-port="3" to-layer="7745" to-port="0" /> + <edge from-layer="7741" from-port="1" to-layer="7744" to-port="0" /> + <edge from-layer="7742" from-port="0" to-layer="7744" to-port="1" /> + <edge from-layer="7743" from-port="0" to-layer="7744" to-port="2" /> + <edge from-layer="7744" from-port="3" to-layer="7745" to-port="1" /> + <edge from-layer="7745" from-port="2" to-layer="7748" to-port="2" /> + <edge from-layer="7746" from-port="0" to-layer="7748" to-port="3" /> + <edge from-layer="7747" from-port="0" to-layer="7748" to-port="4" /> + <edge from-layer="7748" from-port="5" to-layer="7749" to-port="3" /> + <edge from-layer="7749" from-port="4" to-layer="7751" to-port="0" /> + <edge from-layer="7750" from-port="0" to-layer="7751" to-port="1" /> + <edge from-layer="7751" from-port="2" to-layer="7753" to-port="0" /> + <edge from-layer="7752" from-port="0" to-layer="7753" to-port="1" /> + <edge from-layer="7753" from-port="2" to-layer="7764" to-port="0" /> + <edge from-layer="7754" from-port="0" to-layer="7755" to-port="0" /> + <edge from-layer="7755" from-port="1" to-layer="7758" to-port="0" /> + <edge from-layer="7756" from-port="0" to-layer="7757" to-port="0" /> + <edge from-layer="7757" from-port="1" to-layer="7758" to-port="1" /> + <edge from-layer="7758" from-port="2" to-layer="7760" to-port="0" /> + <edge from-layer="7759" from-port="0" to-layer="7760" to-port="1" /> + <edge from-layer="7760" from-port="2" to-layer="7762" to-port="0" /> + <edge from-layer="7761" from-port="0" to-layer="7762" to-port="1" /> + <edge from-layer="7762" from-port="2" to-layer="7763" to-port="0" /> + <edge from-layer="7763" from-port="1" to-layer="7764" to-port="1" /> + <edge from-layer="7764" from-port="2" to-layer="7765" to-port="1" /> + <edge from-layer="7765" from-port="2" to-layer="7769" to-port="0" /> + <edge from-layer="7765" from-port="2" to-layer="7776" to-port="0" /> + <edge from-layer="7765" from-port="2" to-layer="7813" to-port="0" /> + <edge from-layer="7766" from-port="0" to-layer="7777" to-port="0" /> + <edge from-layer="7767" from-port="0" to-layer="7775" to-port="0" /> + <edge from-layer="7768" from-port="0" to-layer="7769" to-port="1" /> + <edge from-layer="7769" from-port="2" to-layer="7771" to-port="0" /> + <edge from-layer="7770" from-port="0" to-layer="7771" to-port="1" /> + <edge from-layer="7771" from-port="2" to-layer="7773" to-port="0" /> + <edge from-layer="7772" from-port="0" to-layer="7773" to-port="1" /> + <edge from-layer="7773" from-port="2" to-layer="7774" to-port="0" /> + <edge from-layer="7774" from-port="1" to-layer="7775" to-port="1" /> + <edge from-layer="7775" from-port="2" to-layer="7776" to-port="1" /> + <edge from-layer="7776" from-port="2" to-layer="7777" to-port="1" /> + <edge from-layer="7777" from-port="2" to-layer="7800" to-port="0" /> + <edge from-layer="7777" from-port="2" to-layer="7788" to-port="0" /> + <edge from-layer="7778" from-port="0" to-layer="7779" to-port="0" /> + <edge from-layer="7779" from-port="1" to-layer="7782" to-port="0" /> + <edge from-layer="7780" from-port="0" to-layer="7781" to-port="0" /> + <edge from-layer="7781" from-port="1" to-layer="7782" to-port="1" /> + <edge from-layer="7782" from-port="2" to-layer="7784" to-port="0" /> + <edge from-layer="7783" from-port="0" to-layer="7784" to-port="1" /> + <edge from-layer="7784" from-port="2" to-layer="7786" to-port="0" /> + <edge from-layer="7785" from-port="0" to-layer="7786" to-port="1" /> + <edge from-layer="7786" from-port="2" to-layer="7787" to-port="0" /> + <edge from-layer="7787" from-port="1" to-layer="7788" to-port="1" /> + <edge from-layer="7788" from-port="2" to-layer="7789" to-port="0" /> + <edge from-layer="7789" from-port="1" to-layer="7801" to-port="0" /> + <edge from-layer="7790" from-port="0" to-layer="7791" to-port="0" /> + <edge from-layer="7791" from-port="1" to-layer="7794" to-port="0" /> + <edge from-layer="7792" from-port="0" to-layer="7793" to-port="0" /> + <edge from-layer="7793" from-port="1" to-layer="7794" to-port="1" /> + <edge from-layer="7794" from-port="2" to-layer="7796" to-port="0" /> + <edge from-layer="7795" from-port="0" to-layer="7796" to-port="1" /> + <edge from-layer="7796" from-port="2" to-layer="7798" to-port="0" /> + <edge from-layer="7797" from-port="0" to-layer="7798" to-port="1" /> + <edge from-layer="7798" from-port="2" to-layer="7799" to-port="0" /> + <edge from-layer="7799" from-port="1" to-layer="7800" to-port="1" /> + <edge from-layer="7800" from-port="2" to-layer="7801" to-port="1" /> + <edge from-layer="7801" from-port="2" to-layer="7812" to-port="0" /> + <edge from-layer="7802" from-port="0" to-layer="7803" to-port="0" /> + <edge from-layer="7803" from-port="1" to-layer="7806" to-port="0" /> + <edge from-layer="7804" from-port="0" to-layer="7805" to-port="0" /> + <edge from-layer="7805" from-port="1" to-layer="7806" to-port="1" /> + <edge from-layer="7806" from-port="2" to-layer="7808" to-port="0" /> + <edge from-layer="7807" from-port="0" to-layer="7808" to-port="1" /> + <edge from-layer="7808" from-port="2" to-layer="7810" to-port="0" /> + <edge from-layer="7809" from-port="0" to-layer="7810" to-port="1" /> + <edge from-layer="7810" from-port="2" to-layer="7811" to-port="0" /> + <edge from-layer="7811" from-port="1" to-layer="7812" to-port="1" /> + <edge from-layer="7812" from-port="2" to-layer="7813" to-port="1" /> + <edge from-layer="7813" from-port="2" to-layer="7817" to-port="0" /> + <edge from-layer="7813" from-port="2" to-layer="7997" to-port="0" /> + <edge from-layer="7813" from-port="2" to-layer="7824" to-port="0" /> + <edge from-layer="7814" from-port="0" to-layer="7825" to-port="0" /> + <edge from-layer="7815" from-port="0" to-layer="7823" to-port="0" /> + <edge from-layer="7816" from-port="0" to-layer="7817" to-port="1" /> + <edge from-layer="7817" from-port="2" to-layer="7819" to-port="0" /> + <edge from-layer="7818" from-port="0" to-layer="7819" to-port="1" /> + <edge from-layer="7819" from-port="2" to-layer="7821" to-port="0" /> + <edge from-layer="7820" from-port="0" to-layer="7821" to-port="1" /> + <edge from-layer="7821" from-port="2" to-layer="7822" to-port="0" /> + <edge from-layer="7822" from-port="1" to-layer="7823" to-port="1" /> + <edge from-layer="7823" from-port="2" to-layer="7824" to-port="1" /> + <edge from-layer="7824" from-port="2" to-layer="7825" to-port="1" /> + <edge from-layer="7825" from-port="2" to-layer="7946" to-port="0" /> + <edge from-layer="7825" from-port="2" to-layer="7836" to-port="0" /> + <edge from-layer="7825" from-port="2" to-layer="7884" to-port="0" /> + <edge from-layer="7826" from-port="0" to-layer="7827" to-port="0" /> + <edge from-layer="7827" from-port="1" to-layer="7830" to-port="0" /> + <edge from-layer="7828" from-port="0" to-layer="7829" to-port="0" /> + <edge from-layer="7829" from-port="1" to-layer="7830" to-port="1" /> + <edge from-layer="7830" from-port="2" to-layer="7832" to-port="0" /> + <edge from-layer="7831" from-port="0" to-layer="7832" to-port="1" /> + <edge from-layer="7832" from-port="2" to-layer="7834" to-port="0" /> + <edge from-layer="7833" from-port="0" to-layer="7834" to-port="1" /> + <edge from-layer="7834" from-port="2" to-layer="7835" to-port="0" /> + <edge from-layer="7835" from-port="1" to-layer="7836" to-port="1" /> + <edge from-layer="7836" from-port="2" to-layer="7839" to-port="0" /> + <edge from-layer="7837" from-port="0" to-layer="7838" to-port="0" /> + <edge from-layer="7838" from-port="1" to-layer="7839" to-port="1" /> + <edge from-layer="7839" from-port="2" to-layer="7841" to-port="0" /> + <edge from-layer="7840" from-port="0" to-layer="7841" to-port="1" /> + <edge from-layer="7841" from-port="2" to-layer="7843" to-port="0" /> + <edge from-layer="7842" from-port="0" to-layer="7843" to-port="1" /> + <edge from-layer="7843" from-port="2" to-layer="7861" to-port="0" /> + <edge from-layer="7843" from-port="2" to-layer="7855" to-port="0" /> + <edge from-layer="7843" from-port="2" to-layer="7845" to-port="0" /> + <edge from-layer="7843" from-port="2" to-layer="7844" to-port="0" /> + <edge from-layer="7844" from-port="2" to-layer="7864" to-port="0" /> + <edge from-layer="7845" from-port="1" to-layer="7847" to-port="0" /> + <edge from-layer="7846" from-port="0" to-layer="7847" to-port="2" /> + <edge from-layer="7847" from-port="3" to-layer="7848" to-port="0" /> + <edge from-layer="7848" from-port="2" to-layer="7849" to-port="0" /> + <edge from-layer="7849" from-port="1" to-layer="7851" to-port="0" /> + <edge from-layer="7850" from-port="0" to-layer="7851" to-port="1" /> + <edge from-layer="7851" from-port="2" to-layer="7861" to-port="2" /> + <edge from-layer="7851" from-port="2" to-layer="7855" to-port="1" /> + <edge from-layer="7852" from-port="0" to-layer="7855" to-port="2" /> + <edge from-layer="7853" from-port="0" to-layer="7855" to-port="3" /> + <edge from-layer="7854" from-port="0" to-layer="7855" to-port="4" /> + <edge from-layer="7855" from-port="5" to-layer="7857" to-port="0" /> + <edge from-layer="7856" from-port="0" to-layer="7857" to-port="1" /> + <edge from-layer="7857" from-port="2" to-layer="7862" to-port="0" /> + <edge from-layer="7858" from-port="0" to-layer="7861" to-port="1" /> + <edge from-layer="7859" from-port="0" to-layer="7861" to-port="3" /> + <edge from-layer="7860" from-port="0" to-layer="7861" to-port="4" /> + <edge from-layer="7861" from-port="5" to-layer="7862" to-port="1" /> + <edge from-layer="7862" from-port="2" to-layer="7863" to-port="0" /> + <edge from-layer="7863" from-port="2" to-layer="7864" to-port="1" /> + <edge from-layer="7864" from-port="2" to-layer="7981" to-port="0" /> + <edge from-layer="7865" from-port="0" to-layer="7870" to-port="0" /> + <edge from-layer="7866" from-port="0" to-layer="7869" to-port="1" /> + <edge from-layer="7867" from-port="0" to-layer="7869" to-port="2" /> + <edge from-layer="7868" from-port="0" to-layer="7869" to-port="3" /> + <edge from-layer="7869" from-port="4" to-layer="7870" to-port="1" /> + <edge from-layer="7870" from-port="2" to-layer="7871" to-port="0" /> + <edge from-layer="7871" from-port="1" to-layer="7873" to-port="0" /> + <edge from-layer="7872" from-port="0" to-layer="7873" to-port="2" /> + <edge from-layer="7873" from-port="3" to-layer="7913" to-port="0" /> + <edge from-layer="7873" from-port="3" to-layer="7969" to-port="0" /> + <edge from-layer="7874" from-port="0" to-layer="7875" to-port="0" /> + <edge from-layer="7875" from-port="1" to-layer="7878" to-port="0" /> + <edge from-layer="7876" from-port="0" to-layer="7877" to-port="0" /> + <edge from-layer="7877" from-port="1" to-layer="7878" to-port="1" /> + <edge from-layer="7878" from-port="2" to-layer="7880" to-port="0" /> + <edge from-layer="7879" from-port="0" to-layer="7880" to-port="1" /> + <edge from-layer="7880" from-port="2" to-layer="7882" to-port="0" /> + <edge from-layer="7881" from-port="0" to-layer="7882" to-port="1" /> + <edge from-layer="7882" from-port="2" to-layer="7883" to-port="0" /> + <edge from-layer="7883" from-port="1" to-layer="7884" to-port="1" /> + <edge from-layer="7884" from-port="2" to-layer="7887" to-port="0" /> + <edge from-layer="7885" from-port="0" to-layer="7886" to-port="0" /> + <edge from-layer="7886" from-port="1" to-layer="7887" to-port="1" /> + <edge from-layer="7887" from-port="2" to-layer="7889" to-port="0" /> + <edge from-layer="7888" from-port="0" to-layer="7889" to-port="1" /> + <edge from-layer="7889" from-port="2" to-layer="7891" to-port="0" /> + <edge from-layer="7890" from-port="0" to-layer="7891" to-port="1" /> + <edge from-layer="7891" from-port="2" to-layer="7892" to-port="0" /> + <edge from-layer="7891" from-port="2" to-layer="7893" to-port="0" /> + <edge from-layer="7891" from-port="2" to-layer="7903" to-port="0" /> + <edge from-layer="7891" from-port="2" to-layer="7909" to-port="0" /> + <edge from-layer="7892" from-port="2" to-layer="7912" to-port="0" /> + <edge from-layer="7893" from-port="1" to-layer="7895" to-port="0" /> + <edge from-layer="7894" from-port="0" to-layer="7895" to-port="2" /> + <edge from-layer="7895" from-port="3" to-layer="7896" to-port="0" /> + <edge from-layer="7896" from-port="2" to-layer="7897" to-port="0" /> + <edge from-layer="7897" from-port="1" to-layer="7899" to-port="0" /> + <edge from-layer="7898" from-port="0" to-layer="7899" to-port="1" /> + <edge from-layer="7899" from-port="2" to-layer="7903" to-port="1" /> + <edge from-layer="7899" from-port="2" to-layer="7909" to-port="2" /> + <edge from-layer="7900" from-port="0" to-layer="7903" to-port="2" /> + <edge from-layer="7901" from-port="0" to-layer="7903" to-port="3" /> + <edge from-layer="7902" from-port="0" to-layer="7903" to-port="4" /> + <edge from-layer="7903" from-port="5" to-layer="7905" to-port="0" /> + <edge from-layer="7904" from-port="0" to-layer="7905" to-port="1" /> + <edge from-layer="7905" from-port="2" to-layer="7910" to-port="0" /> + <edge from-layer="7906" from-port="0" to-layer="7909" to-port="1" /> + <edge from-layer="7907" from-port="0" to-layer="7909" to-port="3" /> + <edge from-layer="7908" from-port="0" to-layer="7909" to-port="4" /> + <edge from-layer="7909" from-port="5" to-layer="7910" to-port="1" /> + <edge from-layer="7910" from-port="2" to-layer="7911" to-port="0" /> + <edge from-layer="7911" from-port="2" to-layer="7912" to-port="1" /> + <edge from-layer="7912" from-port="2" to-layer="7973" to-port="0" /> + <edge from-layer="7912" from-port="2" to-layer="7913" to-port="1" /> + <edge from-layer="7913" from-port="2" to-layer="7914" to-port="0" /> + <edge from-layer="7913" from-port="2" to-layer="7915" to-port="0" /> + <edge from-layer="7913" from-port="2" to-layer="11172" to-port="0" /> + <edge from-layer="7914" from-port="2" to-layer="7924" to-port="0" /> + <edge from-layer="7915" from-port="1" to-layer="7918" to-port="0" /> + <edge from-layer="7915" from-port="1" to-layer="7922" to-port="0" /> + <edge from-layer="7916" from-port="0" to-layer="7918" to-port="1" /> + <edge from-layer="7917" from-port="0" to-layer="7918" to-port="2" /> + <edge from-layer="7918" from-port="3" to-layer="7923" to-port="0" /> + <edge from-layer="7919" from-port="0" to-layer="7923" to-port="1" /> + <edge from-layer="7920" from-port="0" to-layer="7922" to-port="1" /> + <edge from-layer="7921" from-port="0" to-layer="7922" to-port="2" /> + <edge from-layer="7922" from-port="3" to-layer="7923" to-port="2" /> + <edge from-layer="7923" from-port="3" to-layer="7924" to-port="1" /> + <edge from-layer="7924" from-port="2" to-layer="7926" to-port="0" /> + <edge from-layer="7925" from-port="0" to-layer="7926" to-port="1" /> + <edge from-layer="7926" from-port="2" to-layer="7981" to-port="1" /> + <edge from-layer="7927" from-port="0" to-layer="7932" to-port="0" /> + <edge from-layer="7928" from-port="0" to-layer="7931" to-port="1" /> + <edge from-layer="7929" from-port="0" to-layer="7931" to-port="2" /> + <edge from-layer="7930" from-port="0" to-layer="7931" to-port="3" /> + <edge from-layer="7931" from-port="4" to-layer="7932" to-port="1" /> + <edge from-layer="7932" from-port="2" to-layer="7933" to-port="0" /> + <edge from-layer="7933" from-port="1" to-layer="7935" to-port="0" /> + <edge from-layer="7934" from-port="0" to-layer="7935" to-port="2" /> + <edge from-layer="7935" from-port="3" to-layer="7954" to-port="0" /> + <edge from-layer="7936" from-port="0" to-layer="7937" to-port="0" /> + <edge from-layer="7937" from-port="1" to-layer="7940" to-port="0" /> + <edge from-layer="7938" from-port="0" to-layer="7939" to-port="0" /> + <edge from-layer="7939" from-port="1" to-layer="7940" to-port="1" /> + <edge from-layer="7940" from-port="2" to-layer="7942" to-port="0" /> + <edge from-layer="7941" from-port="0" to-layer="7942" to-port="1" /> + <edge from-layer="7942" from-port="2" to-layer="7944" to-port="0" /> + <edge from-layer="7943" from-port="0" to-layer="7944" to-port="1" /> + <edge from-layer="7944" from-port="2" to-layer="7945" to-port="0" /> + <edge from-layer="7945" from-port="1" to-layer="7946" to-port="1" /> + <edge from-layer="7946" from-port="2" to-layer="7949" to-port="0" /> + <edge from-layer="7947" from-port="0" to-layer="7948" to-port="0" /> + <edge from-layer="7948" from-port="1" to-layer="7949" to-port="1" /> + <edge from-layer="7949" from-port="2" to-layer="7951" to-port="0" /> + <edge from-layer="7950" from-port="0" to-layer="7951" to-port="1" /> + <edge from-layer="7951" from-port="2" to-layer="7953" to-port="0" /> + <edge from-layer="7952" from-port="0" to-layer="7953" to-port="1" /> + <edge from-layer="7953" from-port="2" to-layer="7954" to-port="1" /> + <edge from-layer="7954" from-port="2" to-layer="7955" to-port="0" /> + <edge from-layer="7954" from-port="2" to-layer="7956" to-port="0" /> + <edge from-layer="7954" from-port="2" to-layer="11171" to-port="0" /> + <edge from-layer="7955" from-port="2" to-layer="7965" to-port="0" /> + <edge from-layer="7956" from-port="1" to-layer="7963" to-port="0" /> + <edge from-layer="7956" from-port="1" to-layer="7959" to-port="0" /> + <edge from-layer="7957" from-port="0" to-layer="7959" to-port="1" /> + <edge from-layer="7958" from-port="0" to-layer="7959" to-port="2" /> + <edge from-layer="7959" from-port="3" to-layer="7964" to-port="1" /> + <edge from-layer="7960" from-port="0" to-layer="7964" to-port="2" /> + <edge from-layer="7961" from-port="0" to-layer="7963" to-port="1" /> + <edge from-layer="7962" from-port="0" to-layer="7963" to-port="2" /> + <edge from-layer="7963" from-port="3" to-layer="7964" to-port="3" /> + <edge from-layer="7964" from-port="4" to-layer="7965" to-port="1" /> + <edge from-layer="7965" from-port="2" to-layer="7967" to-port="0" /> + <edge from-layer="7966" from-port="0" to-layer="7967" to-port="1" /> + <edge from-layer="7967" from-port="2" to-layer="7981" to-port="2" /> + <edge from-layer="7968" from-port="0" to-layer="7980" to-port="1" /> + <edge from-layer="7969" from-port="1" to-layer="7972" to-port="0" /> + <edge from-layer="7970" from-port="0" to-layer="7972" to-port="1" /> + <edge from-layer="7971" from-port="0" to-layer="7972" to-port="2" /> + <edge from-layer="7972" from-port="3" to-layer="7977" to-port="0" /> + <edge from-layer="7973" from-port="1" to-layer="7976" to-port="0" /> + <edge from-layer="7974" from-port="0" to-layer="7976" to-port="1" /> + <edge from-layer="7975" from-port="0" to-layer="7976" to-port="2" /> + <edge from-layer="7976" from-port="3" to-layer="7977" to-port="1" /> + <edge from-layer="7977" from-port="2" to-layer="7980" to-port="2" /> + <edge from-layer="7978" from-port="0" to-layer="7980" to-port="3" /> + <edge from-layer="7979" from-port="0" to-layer="7980" to-port="4" /> + <edge from-layer="7980" from-port="5" to-layer="7981" to-port="3" /> + <edge from-layer="7981" from-port="4" to-layer="7983" to-port="0" /> + <edge from-layer="7982" from-port="0" to-layer="7983" to-port="1" /> + <edge from-layer="7983" from-port="2" to-layer="7985" to-port="0" /> + <edge from-layer="7984" from-port="0" to-layer="7985" to-port="1" /> + <edge from-layer="7985" from-port="2" to-layer="7996" to-port="0" /> + <edge from-layer="7986" from-port="0" to-layer="7987" to-port="0" /> + <edge from-layer="7987" from-port="1" to-layer="7990" to-port="0" /> + <edge from-layer="7988" from-port="0" to-layer="7989" to-port="0" /> + <edge from-layer="7989" from-port="1" to-layer="7990" to-port="1" /> + <edge from-layer="7990" from-port="2" to-layer="7992" to-port="0" /> + <edge from-layer="7991" from-port="0" to-layer="7992" to-port="1" /> + <edge from-layer="7992" from-port="2" to-layer="7994" to-port="0" /> + <edge from-layer="7993" from-port="0" to-layer="7994" to-port="1" /> + <edge from-layer="7994" from-port="2" to-layer="7995" to-port="0" /> + <edge from-layer="7995" from-port="1" to-layer="7996" to-port="1" /> + <edge from-layer="7996" from-port="2" to-layer="7997" to-port="1" /> + <edge from-layer="7997" from-port="2" to-layer="8045" to-port="0" /> + <edge from-layer="7997" from-port="2" to-layer="8001" to-port="0" /> + <edge from-layer="7997" from-port="2" to-layer="8008" to-port="0" /> + <edge from-layer="7998" from-port="0" to-layer="8009" to-port="0" /> + <edge from-layer="7999" from-port="0" to-layer="8007" to-port="0" /> + <edge from-layer="8000" from-port="0" to-layer="8001" to-port="1" /> + <edge from-layer="8001" from-port="2" to-layer="8003" to-port="0" /> + <edge from-layer="8002" from-port="0" to-layer="8003" to-port="1" /> + <edge from-layer="8003" from-port="2" to-layer="8005" to-port="0" /> + <edge from-layer="8004" from-port="0" to-layer="8005" to-port="1" /> + <edge from-layer="8005" from-port="2" to-layer="8006" to-port="0" /> + <edge from-layer="8006" from-port="1" to-layer="8007" to-port="1" /> + <edge from-layer="8007" from-port="2" to-layer="8008" to-port="1" /> + <edge from-layer="8008" from-port="2" to-layer="8009" to-port="1" /> + <edge from-layer="8009" from-port="2" to-layer="8032" to-port="0" /> + <edge from-layer="8009" from-port="2" to-layer="8020" to-port="0" /> + <edge from-layer="8010" from-port="0" to-layer="8011" to-port="0" /> + <edge from-layer="8011" from-port="1" to-layer="8014" to-port="0" /> + <edge from-layer="8012" from-port="0" to-layer="8013" to-port="0" /> + <edge from-layer="8013" from-port="1" to-layer="8014" to-port="1" /> + <edge from-layer="8014" from-port="2" to-layer="8016" to-port="0" /> + <edge from-layer="8015" from-port="0" to-layer="8016" to-port="1" /> + <edge from-layer="8016" from-port="2" to-layer="8018" to-port="0" /> + <edge from-layer="8017" from-port="0" to-layer="8018" to-port="1" /> + <edge from-layer="8018" from-port="2" to-layer="8019" to-port="0" /> + <edge from-layer="8019" from-port="1" to-layer="8020" to-port="1" /> + <edge from-layer="8020" from-port="2" to-layer="8021" to-port="0" /> + <edge from-layer="8021" from-port="1" to-layer="8033" to-port="0" /> + <edge from-layer="8022" from-port="0" to-layer="8023" to-port="0" /> + <edge from-layer="8023" from-port="1" to-layer="8026" to-port="0" /> + <edge from-layer="8024" from-port="0" to-layer="8025" to-port="0" /> + <edge from-layer="8025" from-port="1" to-layer="8026" to-port="1" /> + <edge from-layer="8026" from-port="2" to-layer="8028" to-port="0" /> + <edge from-layer="8027" from-port="0" to-layer="8028" to-port="1" /> + <edge from-layer="8028" from-port="2" to-layer="8030" to-port="0" /> + <edge from-layer="8029" from-port="0" to-layer="8030" to-port="1" /> + <edge from-layer="8030" from-port="2" to-layer="8031" to-port="0" /> + <edge from-layer="8031" from-port="1" to-layer="8032" to-port="1" /> + <edge from-layer="8032" from-port="2" to-layer="8033" to-port="1" /> + <edge from-layer="8033" from-port="2" to-layer="8044" to-port="0" /> + <edge from-layer="8034" from-port="0" to-layer="8035" to-port="0" /> + <edge from-layer="8035" from-port="1" to-layer="8038" to-port="0" /> + <edge from-layer="8036" from-port="0" to-layer="8037" to-port="0" /> + <edge from-layer="8037" from-port="1" to-layer="8038" to-port="1" /> + <edge from-layer="8038" from-port="2" to-layer="8040" to-port="0" /> + <edge from-layer="8039" from-port="0" to-layer="8040" to-port="1" /> + <edge from-layer="8040" from-port="2" to-layer="8042" to-port="0" /> + <edge from-layer="8041" from-port="0" to-layer="8042" to-port="1" /> + <edge from-layer="8042" from-port="2" to-layer="8043" to-port="0" /> + <edge from-layer="8043" from-port="1" to-layer="8044" to-port="1" /> + <edge from-layer="8044" from-port="2" to-layer="8045" to-port="1" /> + <edge from-layer="8045" from-port="2" to-layer="8056" to-port="0" /> + <edge from-layer="8045" from-port="2" to-layer="8049" to-port="0" /> + <edge from-layer="8045" from-port="2" to-layer="8229" to-port="0" /> + <edge from-layer="8046" from-port="0" to-layer="8057" to-port="0" /> + <edge from-layer="8047" from-port="0" to-layer="8055" to-port="0" /> + <edge from-layer="8048" from-port="0" to-layer="8049" to-port="1" /> + <edge from-layer="8049" from-port="2" to-layer="8051" to-port="0" /> + <edge from-layer="8050" from-port="0" to-layer="8051" to-port="1" /> + <edge from-layer="8051" from-port="2" to-layer="8053" to-port="0" /> + <edge from-layer="8052" from-port="0" to-layer="8053" to-port="1" /> + <edge from-layer="8053" from-port="2" to-layer="8054" to-port="0" /> + <edge from-layer="8054" from-port="1" to-layer="8055" to-port="1" /> + <edge from-layer="8055" from-port="2" to-layer="8056" to-port="1" /> + <edge from-layer="8056" from-port="2" to-layer="8057" to-port="1" /> + <edge from-layer="8057" from-port="2" to-layer="8178" to-port="0" /> + <edge from-layer="8057" from-port="2" to-layer="8116" to-port="0" /> + <edge from-layer="8057" from-port="2" to-layer="8068" to-port="0" /> + <edge from-layer="8058" from-port="0" to-layer="8059" to-port="0" /> + <edge from-layer="8059" from-port="1" to-layer="8062" to-port="0" /> + <edge from-layer="8060" from-port="0" to-layer="8061" to-port="0" /> + <edge from-layer="8061" from-port="1" to-layer="8062" to-port="1" /> + <edge from-layer="8062" from-port="2" to-layer="8064" to-port="0" /> + <edge from-layer="8063" from-port="0" to-layer="8064" to-port="1" /> + <edge from-layer="8064" from-port="2" to-layer="8066" to-port="0" /> + <edge from-layer="8065" from-port="0" to-layer="8066" to-port="1" /> + <edge from-layer="8066" from-port="2" to-layer="8067" to-port="0" /> + <edge from-layer="8067" from-port="1" to-layer="8068" to-port="1" /> + <edge from-layer="8068" from-port="2" to-layer="8071" to-port="0" /> + <edge from-layer="8069" from-port="0" to-layer="8070" to-port="0" /> + <edge from-layer="8070" from-port="1" to-layer="8071" to-port="1" /> + <edge from-layer="8071" from-port="2" to-layer="8073" to-port="0" /> + <edge from-layer="8072" from-port="0" to-layer="8073" to-port="1" /> + <edge from-layer="8073" from-port="2" to-layer="8075" to-port="0" /> + <edge from-layer="8074" from-port="0" to-layer="8075" to-port="1" /> + <edge from-layer="8075" from-port="2" to-layer="8077" to-port="0" /> + <edge from-layer="8075" from-port="2" to-layer="8076" to-port="0" /> + <edge from-layer="8075" from-port="2" to-layer="8093" to-port="0" /> + <edge from-layer="8075" from-port="2" to-layer="8087" to-port="0" /> + <edge from-layer="8076" from-port="2" to-layer="8096" to-port="0" /> + <edge from-layer="8077" from-port="1" to-layer="8079" to-port="0" /> + <edge from-layer="8078" from-port="0" to-layer="8079" to-port="2" /> + <edge from-layer="8079" from-port="3" to-layer="8080" to-port="0" /> + <edge from-layer="8080" from-port="2" to-layer="8081" to-port="0" /> + <edge from-layer="8081" from-port="1" to-layer="8083" to-port="0" /> + <edge from-layer="8082" from-port="0" to-layer="8083" to-port="1" /> + <edge from-layer="8083" from-port="2" to-layer="8093" to-port="2" /> + <edge from-layer="8083" from-port="2" to-layer="8087" to-port="1" /> + <edge from-layer="8084" from-port="0" to-layer="8087" to-port="2" /> + <edge from-layer="8085" from-port="0" to-layer="8087" to-port="3" /> + <edge from-layer="8086" from-port="0" to-layer="8087" to-port="4" /> + <edge from-layer="8087" from-port="5" to-layer="8089" to-port="0" /> + <edge from-layer="8088" from-port="0" to-layer="8089" to-port="1" /> + <edge from-layer="8089" from-port="2" to-layer="8094" to-port="0" /> + <edge from-layer="8090" from-port="0" to-layer="8093" to-port="1" /> + <edge from-layer="8091" from-port="0" to-layer="8093" to-port="3" /> + <edge from-layer="8092" from-port="0" to-layer="8093" to-port="4" /> + <edge from-layer="8093" from-port="5" to-layer="8094" to-port="1" /> + <edge from-layer="8094" from-port="2" to-layer="8095" to-port="0" /> + <edge from-layer="8095" from-port="2" to-layer="8096" to-port="1" /> + <edge from-layer="8096" from-port="2" to-layer="8213" to-port="0" /> + <edge from-layer="8097" from-port="0" to-layer="8102" to-port="0" /> + <edge from-layer="8098" from-port="0" to-layer="8101" to-port="1" /> + <edge from-layer="8099" from-port="0" to-layer="8101" to-port="2" /> + <edge from-layer="8100" from-port="0" to-layer="8101" to-port="3" /> + <edge from-layer="8101" from-port="4" to-layer="8102" to-port="1" /> + <edge from-layer="8102" from-port="2" to-layer="8103" to-port="0" /> + <edge from-layer="8103" from-port="1" to-layer="8105" to-port="0" /> + <edge from-layer="8104" from-port="0" to-layer="8105" to-port="2" /> + <edge from-layer="8105" from-port="3" to-layer="8145" to-port="0" /> + <edge from-layer="8105" from-port="3" to-layer="8201" to-port="0" /> + <edge from-layer="8106" from-port="0" to-layer="8107" to-port="0" /> + <edge from-layer="8107" from-port="1" to-layer="8110" to-port="0" /> + <edge from-layer="8108" from-port="0" to-layer="8109" to-port="0" /> + <edge from-layer="8109" from-port="1" to-layer="8110" to-port="1" /> + <edge from-layer="8110" from-port="2" to-layer="8112" to-port="0" /> + <edge from-layer="8111" from-port="0" to-layer="8112" to-port="1" /> + <edge from-layer="8112" from-port="2" to-layer="8114" to-port="0" /> + <edge from-layer="8113" from-port="0" to-layer="8114" to-port="1" /> + <edge from-layer="8114" from-port="2" to-layer="8115" to-port="0" /> + <edge from-layer="8115" from-port="1" to-layer="8116" to-port="1" /> + <edge from-layer="8116" from-port="2" to-layer="8119" to-port="0" /> + <edge from-layer="8117" from-port="0" to-layer="8118" to-port="0" /> + <edge from-layer="8118" from-port="1" to-layer="8119" to-port="1" /> + <edge from-layer="8119" from-port="2" to-layer="8121" to-port="0" /> + <edge from-layer="8120" from-port="0" to-layer="8121" to-port="1" /> + <edge from-layer="8121" from-port="2" to-layer="8123" to-port="0" /> + <edge from-layer="8122" from-port="0" to-layer="8123" to-port="1" /> + <edge from-layer="8123" from-port="2" to-layer="8135" to-port="0" /> + <edge from-layer="8123" from-port="2" to-layer="8124" to-port="0" /> + <edge from-layer="8123" from-port="2" to-layer="8141" to-port="0" /> + <edge from-layer="8123" from-port="2" to-layer="8125" to-port="0" /> + <edge from-layer="8124" from-port="2" to-layer="8144" to-port="0" /> + <edge from-layer="8125" from-port="1" to-layer="8127" to-port="0" /> + <edge from-layer="8126" from-port="0" to-layer="8127" to-port="2" /> + <edge from-layer="8127" from-port="3" to-layer="8128" to-port="0" /> + <edge from-layer="8128" from-port="2" to-layer="8129" to-port="0" /> + <edge from-layer="8129" from-port="1" to-layer="8131" to-port="0" /> + <edge from-layer="8130" from-port="0" to-layer="8131" to-port="1" /> + <edge from-layer="8131" from-port="2" to-layer="8135" to-port="1" /> + <edge from-layer="8131" from-port="2" to-layer="8141" to-port="2" /> + <edge from-layer="8132" from-port="0" to-layer="8135" to-port="2" /> + <edge from-layer="8133" from-port="0" to-layer="8135" to-port="3" /> + <edge from-layer="8134" from-port="0" to-layer="8135" to-port="4" /> + <edge from-layer="8135" from-port="5" to-layer="8137" to-port="0" /> + <edge from-layer="8136" from-port="0" to-layer="8137" to-port="1" /> + <edge from-layer="8137" from-port="2" to-layer="8142" to-port="0" /> + <edge from-layer="8138" from-port="0" to-layer="8141" to-port="1" /> + <edge from-layer="8139" from-port="0" to-layer="8141" to-port="3" /> + <edge from-layer="8140" from-port="0" to-layer="8141" to-port="4" /> + <edge from-layer="8141" from-port="5" to-layer="8142" to-port="1" /> + <edge from-layer="8142" from-port="2" to-layer="8143" to-port="0" /> + <edge from-layer="8143" from-port="2" to-layer="8144" to-port="1" /> + <edge from-layer="8144" from-port="2" to-layer="8145" to-port="1" /> + <edge from-layer="8144" from-port="2" to-layer="8205" to-port="0" /> + <edge from-layer="8145" from-port="2" to-layer="8146" to-port="0" /> + <edge from-layer="8145" from-port="2" to-layer="8147" to-port="0" /> + <edge from-layer="8145" from-port="2" to-layer="11170" to-port="0" /> + <edge from-layer="8146" from-port="2" to-layer="8156" to-port="0" /> + <edge from-layer="8147" from-port="1" to-layer="8150" to-port="0" /> + <edge from-layer="8147" from-port="1" to-layer="8154" to-port="0" /> + <edge from-layer="8148" from-port="0" to-layer="8150" to-port="1" /> + <edge from-layer="8149" from-port="0" to-layer="8150" to-port="2" /> + <edge from-layer="8150" from-port="3" to-layer="8155" to-port="0" /> + <edge from-layer="8151" from-port="0" to-layer="8155" to-port="1" /> + <edge from-layer="8152" from-port="0" to-layer="8154" to-port="1" /> + <edge from-layer="8153" from-port="0" to-layer="8154" to-port="2" /> + <edge from-layer="8154" from-port="3" to-layer="8155" to-port="2" /> + <edge from-layer="8155" from-port="3" to-layer="8156" to-port="1" /> + <edge from-layer="8156" from-port="2" to-layer="8158" to-port="0" /> + <edge from-layer="8157" from-port="0" to-layer="8158" to-port="1" /> + <edge from-layer="8158" from-port="2" to-layer="8213" to-port="1" /> + <edge from-layer="8159" from-port="0" to-layer="8164" to-port="0" /> + <edge from-layer="8160" from-port="0" to-layer="8163" to-port="1" /> + <edge from-layer="8161" from-port="0" to-layer="8163" to-port="2" /> + <edge from-layer="8162" from-port="0" to-layer="8163" to-port="3" /> + <edge from-layer="8163" from-port="4" to-layer="8164" to-port="1" /> + <edge from-layer="8164" from-port="2" to-layer="8165" to-port="0" /> + <edge from-layer="8165" from-port="1" to-layer="8167" to-port="0" /> + <edge from-layer="8166" from-port="0" to-layer="8167" to-port="2" /> + <edge from-layer="8167" from-port="3" to-layer="8186" to-port="0" /> + <edge from-layer="8168" from-port="0" to-layer="8169" to-port="0" /> + <edge from-layer="8169" from-port="1" to-layer="8172" to-port="0" /> + <edge from-layer="8170" from-port="0" to-layer="8171" to-port="0" /> + <edge from-layer="8171" from-port="1" to-layer="8172" to-port="1" /> + <edge from-layer="8172" from-port="2" to-layer="8174" to-port="0" /> + <edge from-layer="8173" from-port="0" to-layer="8174" to-port="1" /> + <edge from-layer="8174" from-port="2" to-layer="8176" to-port="0" /> + <edge from-layer="8175" from-port="0" to-layer="8176" to-port="1" /> + <edge from-layer="8176" from-port="2" to-layer="8177" to-port="0" /> + <edge from-layer="8177" from-port="1" to-layer="8178" to-port="1" /> + <edge from-layer="8178" from-port="2" to-layer="8181" to-port="0" /> + <edge from-layer="8179" from-port="0" to-layer="8180" to-port="0" /> + <edge from-layer="8180" from-port="1" to-layer="8181" to-port="1" /> + <edge from-layer="8181" from-port="2" to-layer="8183" to-port="0" /> + <edge from-layer="8182" from-port="0" to-layer="8183" to-port="1" /> + <edge from-layer="8183" from-port="2" to-layer="8185" to-port="0" /> + <edge from-layer="8184" from-port="0" to-layer="8185" to-port="1" /> + <edge from-layer="8185" from-port="2" to-layer="8186" to-port="1" /> + <edge from-layer="8186" from-port="2" to-layer="8188" to-port="0" /> + <edge from-layer="8186" from-port="2" to-layer="11169" to-port="0" /> + <edge from-layer="8186" from-port="2" to-layer="8187" to-port="0" /> + <edge from-layer="8187" from-port="2" to-layer="8197" to-port="0" /> + <edge from-layer="8188" from-port="1" to-layer="8191" to-port="0" /> + <edge from-layer="8188" from-port="1" to-layer="8195" to-port="0" /> + <edge from-layer="8189" from-port="0" to-layer="8191" to-port="1" /> + <edge from-layer="8190" from-port="0" to-layer="8191" to-port="2" /> + <edge from-layer="8191" from-port="3" to-layer="8196" to-port="1" /> + <edge from-layer="8192" from-port="0" to-layer="8196" to-port="2" /> + <edge from-layer="8193" from-port="0" to-layer="8195" to-port="1" /> + <edge from-layer="8194" from-port="0" to-layer="8195" to-port="2" /> + <edge from-layer="8195" from-port="3" to-layer="8196" to-port="3" /> + <edge from-layer="8196" from-port="4" to-layer="8197" to-port="1" /> + <edge from-layer="8197" from-port="2" to-layer="8199" to-port="0" /> + <edge from-layer="8198" from-port="0" to-layer="8199" to-port="1" /> + <edge from-layer="8199" from-port="2" to-layer="8213" to-port="2" /> + <edge from-layer="8200" from-port="0" to-layer="8212" to-port="1" /> + <edge from-layer="8201" from-port="1" to-layer="8204" to-port="0" /> + <edge from-layer="8202" from-port="0" to-layer="8204" to-port="1" /> + <edge from-layer="8203" from-port="0" to-layer="8204" to-port="2" /> + <edge from-layer="8204" from-port="3" to-layer="8209" to-port="0" /> + <edge from-layer="8205" from-port="1" to-layer="8208" to-port="0" /> + <edge from-layer="8206" from-port="0" to-layer="8208" to-port="1" /> + <edge from-layer="8207" from-port="0" to-layer="8208" to-port="2" /> + <edge from-layer="8208" from-port="3" to-layer="8209" to-port="1" /> + <edge from-layer="8209" from-port="2" to-layer="8212" to-port="2" /> + <edge from-layer="8210" from-port="0" to-layer="8212" to-port="3" /> + <edge from-layer="8211" from-port="0" to-layer="8212" to-port="4" /> + <edge from-layer="8212" from-port="5" to-layer="8213" to-port="3" /> + <edge from-layer="8213" from-port="4" to-layer="8215" to-port="0" /> + <edge from-layer="8214" from-port="0" to-layer="8215" to-port="1" /> + <edge from-layer="8215" from-port="2" to-layer="8217" to-port="0" /> + <edge from-layer="8216" from-port="0" to-layer="8217" to-port="1" /> + <edge from-layer="8217" from-port="2" to-layer="8228" to-port="0" /> + <edge from-layer="8218" from-port="0" to-layer="8219" to-port="0" /> + <edge from-layer="8219" from-port="1" to-layer="8222" to-port="0" /> + <edge from-layer="8220" from-port="0" to-layer="8221" to-port="0" /> + <edge from-layer="8221" from-port="1" to-layer="8222" to-port="1" /> + <edge from-layer="8222" from-port="2" to-layer="8224" to-port="0" /> + <edge from-layer="8223" from-port="0" to-layer="8224" to-port="1" /> + <edge from-layer="8224" from-port="2" to-layer="8226" to-port="0" /> + <edge from-layer="8225" from-port="0" to-layer="8226" to-port="1" /> + <edge from-layer="8226" from-port="2" to-layer="8227" to-port="0" /> + <edge from-layer="8227" from-port="1" to-layer="8228" to-port="1" /> + <edge from-layer="8228" from-port="2" to-layer="8229" to-port="1" /> + <edge from-layer="8229" from-port="2" to-layer="8233" to-port="0" /> + <edge from-layer="8229" from-port="2" to-layer="8277" to-port="0" /> + <edge from-layer="8229" from-port="2" to-layer="8240" to-port="0" /> + <edge from-layer="8230" from-port="0" to-layer="8241" to-port="0" /> + <edge from-layer="8231" from-port="0" to-layer="8239" to-port="0" /> + <edge from-layer="8232" from-port="0" to-layer="8233" to-port="1" /> + <edge from-layer="8233" from-port="2" to-layer="8235" to-port="0" /> + <edge from-layer="8234" from-port="0" to-layer="8235" to-port="1" /> + <edge from-layer="8235" from-port="2" to-layer="8237" to-port="0" /> + <edge from-layer="8236" from-port="0" to-layer="8237" to-port="1" /> + <edge from-layer="8237" from-port="2" to-layer="8238" to-port="0" /> + <edge from-layer="8238" from-port="1" to-layer="8239" to-port="1" /> + <edge from-layer="8239" from-port="2" to-layer="8240" to-port="1" /> + <edge from-layer="8240" from-port="2" to-layer="8241" to-port="1" /> + <edge from-layer="8241" from-port="2" to-layer="8264" to-port="0" /> + <edge from-layer="8241" from-port="2" to-layer="8252" to-port="0" /> + <edge from-layer="8242" from-port="0" to-layer="8243" to-port="0" /> + <edge from-layer="8243" from-port="1" to-layer="8246" to-port="0" /> + <edge from-layer="8244" from-port="0" to-layer="8245" to-port="0" /> + <edge from-layer="8245" from-port="1" to-layer="8246" to-port="1" /> + <edge from-layer="8246" from-port="2" to-layer="8248" to-port="0" /> + <edge from-layer="8247" from-port="0" to-layer="8248" to-port="1" /> + <edge from-layer="8248" from-port="2" to-layer="8250" to-port="0" /> + <edge from-layer="8249" from-port="0" to-layer="8250" to-port="1" /> + <edge from-layer="8250" from-port="2" to-layer="8251" to-port="0" /> + <edge from-layer="8251" from-port="1" to-layer="8252" to-port="1" /> + <edge from-layer="8252" from-port="2" to-layer="8253" to-port="0" /> + <edge from-layer="8253" from-port="1" to-layer="8265" to-port="0" /> + <edge from-layer="8254" from-port="0" to-layer="8255" to-port="0" /> + <edge from-layer="8255" from-port="1" to-layer="8258" to-port="0" /> + <edge from-layer="8256" from-port="0" to-layer="8257" to-port="0" /> + <edge from-layer="8257" from-port="1" to-layer="8258" to-port="1" /> + <edge from-layer="8258" from-port="2" to-layer="8260" to-port="0" /> + <edge from-layer="8259" from-port="0" to-layer="8260" to-port="1" /> + <edge from-layer="8260" from-port="2" to-layer="8262" to-port="0" /> + <edge from-layer="8261" from-port="0" to-layer="8262" to-port="1" /> + <edge from-layer="8262" from-port="2" to-layer="8263" to-port="0" /> + <edge from-layer="8263" from-port="1" to-layer="8264" to-port="1" /> + <edge from-layer="8264" from-port="2" to-layer="8265" to-port="1" /> + <edge from-layer="8265" from-port="2" to-layer="8276" to-port="0" /> + <edge from-layer="8266" from-port="0" to-layer="8267" to-port="0" /> + <edge from-layer="8267" from-port="1" to-layer="8270" to-port="0" /> + <edge from-layer="8268" from-port="0" to-layer="8269" to-port="0" /> + <edge from-layer="8269" from-port="1" to-layer="8270" to-port="1" /> + <edge from-layer="8270" from-port="2" to-layer="8272" to-port="0" /> + <edge from-layer="8271" from-port="0" to-layer="8272" to-port="1" /> + <edge from-layer="8272" from-port="2" to-layer="8274" to-port="0" /> + <edge from-layer="8273" from-port="0" to-layer="8274" to-port="1" /> + <edge from-layer="8274" from-port="2" to-layer="8275" to-port="0" /> + <edge from-layer="8275" from-port="1" to-layer="8276" to-port="1" /> + <edge from-layer="8276" from-port="2" to-layer="8277" to-port="1" /> + <edge from-layer="8277" from-port="2" to-layer="8461" to-port="0" /> + <edge from-layer="8277" from-port="2" to-layer="8281" to-port="0" /> + <edge from-layer="8277" from-port="2" to-layer="8288" to-port="0" /> + <edge from-layer="8278" from-port="0" to-layer="8289" to-port="0" /> + <edge from-layer="8279" from-port="0" to-layer="8287" to-port="0" /> + <edge from-layer="8280" from-port="0" to-layer="8281" to-port="1" /> + <edge from-layer="8281" from-port="2" to-layer="8283" to-port="0" /> + <edge from-layer="8282" from-port="0" to-layer="8283" to-port="1" /> + <edge from-layer="8283" from-port="2" to-layer="8285" to-port="0" /> + <edge from-layer="8284" from-port="0" to-layer="8285" to-port="1" /> + <edge from-layer="8285" from-port="2" to-layer="8286" to-port="0" /> + <edge from-layer="8286" from-port="1" to-layer="8287" to-port="1" /> + <edge from-layer="8287" from-port="2" to-layer="8288" to-port="1" /> + <edge from-layer="8288" from-port="2" to-layer="8289" to-port="1" /> + <edge from-layer="8289" from-port="2" to-layer="8410" to-port="0" /> + <edge from-layer="8289" from-port="2" to-layer="8348" to-port="0" /> + <edge from-layer="8289" from-port="2" to-layer="8300" to-port="0" /> + <edge from-layer="8290" from-port="0" to-layer="8291" to-port="0" /> + <edge from-layer="8291" from-port="1" to-layer="8294" to-port="0" /> + <edge from-layer="8292" from-port="0" to-layer="8293" to-port="0" /> + <edge from-layer="8293" from-port="1" to-layer="8294" to-port="1" /> + <edge from-layer="8294" from-port="2" to-layer="8296" to-port="0" /> + <edge from-layer="8295" from-port="0" to-layer="8296" to-port="1" /> + <edge from-layer="8296" from-port="2" to-layer="8298" to-port="0" /> + <edge from-layer="8297" from-port="0" to-layer="8298" to-port="1" /> + <edge from-layer="8298" from-port="2" to-layer="8299" to-port="0" /> + <edge from-layer="8299" from-port="1" to-layer="8300" to-port="1" /> + <edge from-layer="8300" from-port="2" to-layer="8303" to-port="0" /> + <edge from-layer="8301" from-port="0" to-layer="8302" to-port="0" /> + <edge from-layer="8302" from-port="1" to-layer="8303" to-port="1" /> + <edge from-layer="8303" from-port="2" to-layer="8305" to-port="0" /> + <edge from-layer="8304" from-port="0" to-layer="8305" to-port="1" /> + <edge from-layer="8305" from-port="2" to-layer="8307" to-port="0" /> + <edge from-layer="8306" from-port="0" to-layer="8307" to-port="1" /> + <edge from-layer="8307" from-port="2" to-layer="8319" to-port="0" /> + <edge from-layer="8307" from-port="2" to-layer="8325" to-port="0" /> + <edge from-layer="8307" from-port="2" to-layer="8309" to-port="0" /> + <edge from-layer="8307" from-port="2" to-layer="8308" to-port="0" /> + <edge from-layer="8308" from-port="2" to-layer="8328" to-port="0" /> + <edge from-layer="8309" from-port="1" to-layer="8311" to-port="0" /> + <edge from-layer="8310" from-port="0" to-layer="8311" to-port="2" /> + <edge from-layer="8311" from-port="3" to-layer="8312" to-port="0" /> + <edge from-layer="8312" from-port="2" to-layer="8313" to-port="0" /> + <edge from-layer="8313" from-port="1" to-layer="8315" to-port="0" /> + <edge from-layer="8314" from-port="0" to-layer="8315" to-port="1" /> + <edge from-layer="8315" from-port="2" to-layer="8319" to-port="1" /> + <edge from-layer="8315" from-port="2" to-layer="8325" to-port="2" /> + <edge from-layer="8316" from-port="0" to-layer="8319" to-port="2" /> + <edge from-layer="8317" from-port="0" to-layer="8319" to-port="3" /> + <edge from-layer="8318" from-port="0" to-layer="8319" to-port="4" /> + <edge from-layer="8319" from-port="5" to-layer="8321" to-port="0" /> + <edge from-layer="8320" from-port="0" to-layer="8321" to-port="1" /> + <edge from-layer="8321" from-port="2" to-layer="8326" to-port="0" /> + <edge from-layer="8322" from-port="0" to-layer="8325" to-port="1" /> + <edge from-layer="8323" from-port="0" to-layer="8325" to-port="3" /> + <edge from-layer="8324" from-port="0" to-layer="8325" to-port="4" /> + <edge from-layer="8325" from-port="5" to-layer="8326" to-port="1" /> + <edge from-layer="8326" from-port="2" to-layer="8327" to-port="0" /> + <edge from-layer="8327" from-port="2" to-layer="8328" to-port="1" /> + <edge from-layer="8328" from-port="2" to-layer="8445" to-port="0" /> + <edge from-layer="8329" from-port="0" to-layer="8334" to-port="0" /> + <edge from-layer="8330" from-port="0" to-layer="8333" to-port="1" /> + <edge from-layer="8331" from-port="0" to-layer="8333" to-port="2" /> + <edge from-layer="8332" from-port="0" to-layer="8333" to-port="3" /> + <edge from-layer="8333" from-port="4" to-layer="8334" to-port="1" /> + <edge from-layer="8334" from-port="2" to-layer="8335" to-port="0" /> + <edge from-layer="8335" from-port="1" to-layer="8337" to-port="0" /> + <edge from-layer="8336" from-port="0" to-layer="8337" to-port="2" /> + <edge from-layer="8337" from-port="3" to-layer="8433" to-port="0" /> + <edge from-layer="8337" from-port="3" to-layer="8377" to-port="0" /> + <edge from-layer="8338" from-port="0" to-layer="8339" to-port="0" /> + <edge from-layer="8339" from-port="1" to-layer="8342" to-port="0" /> + <edge from-layer="8340" from-port="0" to-layer="8341" to-port="0" /> + <edge from-layer="8341" from-port="1" to-layer="8342" to-port="1" /> + <edge from-layer="8342" from-port="2" to-layer="8344" to-port="0" /> + <edge from-layer="8343" from-port="0" to-layer="8344" to-port="1" /> + <edge from-layer="8344" from-port="2" to-layer="8346" to-port="0" /> + <edge from-layer="8345" from-port="0" to-layer="8346" to-port="1" /> + <edge from-layer="8346" from-port="2" to-layer="8347" to-port="0" /> + <edge from-layer="8347" from-port="1" to-layer="8348" to-port="1" /> + <edge from-layer="8348" from-port="2" to-layer="8351" to-port="0" /> + <edge from-layer="8349" from-port="0" to-layer="8350" to-port="0" /> + <edge from-layer="8350" from-port="1" to-layer="8351" to-port="1" /> + <edge from-layer="8351" from-port="2" to-layer="8353" to-port="0" /> + <edge from-layer="8352" from-port="0" to-layer="8353" to-port="1" /> + <edge from-layer="8353" from-port="2" to-layer="8355" to-port="0" /> + <edge from-layer="8354" from-port="0" to-layer="8355" to-port="1" /> + <edge from-layer="8355" from-port="2" to-layer="8367" to-port="0" /> + <edge from-layer="8355" from-port="2" to-layer="8373" to-port="0" /> + <edge from-layer="8355" from-port="2" to-layer="8357" to-port="0" /> + <edge from-layer="8355" from-port="2" to-layer="8356" to-port="0" /> + <edge from-layer="8356" from-port="2" to-layer="8376" to-port="0" /> + <edge from-layer="8357" from-port="1" to-layer="8359" to-port="0" /> + <edge from-layer="8358" from-port="0" to-layer="8359" to-port="2" /> + <edge from-layer="8359" from-port="3" to-layer="8360" to-port="0" /> + <edge from-layer="8360" from-port="2" to-layer="8361" to-port="0" /> + <edge from-layer="8361" from-port="1" to-layer="8363" to-port="0" /> + <edge from-layer="8362" from-port="0" to-layer="8363" to-port="1" /> + <edge from-layer="8363" from-port="2" to-layer="8367" to-port="1" /> + <edge from-layer="8363" from-port="2" to-layer="8373" to-port="2" /> + <edge from-layer="8364" from-port="0" to-layer="8367" to-port="2" /> + <edge from-layer="8365" from-port="0" to-layer="8367" to-port="3" /> + <edge from-layer="8366" from-port="0" to-layer="8367" to-port="4" /> + <edge from-layer="8367" from-port="5" to-layer="8369" to-port="0" /> + <edge from-layer="8368" from-port="0" to-layer="8369" to-port="1" /> + <edge from-layer="8369" from-port="2" to-layer="8374" to-port="0" /> + <edge from-layer="8370" from-port="0" to-layer="8373" to-port="1" /> + <edge from-layer="8371" from-port="0" to-layer="8373" to-port="3" /> + <edge from-layer="8372" from-port="0" to-layer="8373" to-port="4" /> + <edge from-layer="8373" from-port="5" to-layer="8374" to-port="1" /> + <edge from-layer="8374" from-port="2" to-layer="8375" to-port="0" /> + <edge from-layer="8375" from-port="2" to-layer="8376" to-port="1" /> + <edge from-layer="8376" from-port="2" to-layer="8377" to-port="1" /> + <edge from-layer="8376" from-port="2" to-layer="8437" to-port="0" /> + <edge from-layer="8377" from-port="2" to-layer="11168" to-port="0" /> + <edge from-layer="8377" from-port="2" to-layer="8378" to-port="0" /> + <edge from-layer="8377" from-port="2" to-layer="8379" to-port="0" /> + <edge from-layer="8378" from-port="2" to-layer="8388" to-port="0" /> + <edge from-layer="8379" from-port="1" to-layer="8386" to-port="0" /> + <edge from-layer="8379" from-port="1" to-layer="8382" to-port="0" /> + <edge from-layer="8380" from-port="0" to-layer="8382" to-port="1" /> + <edge from-layer="8381" from-port="0" to-layer="8382" to-port="2" /> + <edge from-layer="8382" from-port="3" to-layer="8387" to-port="0" /> + <edge from-layer="8383" from-port="0" to-layer="8387" to-port="1" /> + <edge from-layer="8384" from-port="0" to-layer="8386" to-port="1" /> + <edge from-layer="8385" from-port="0" to-layer="8386" to-port="2" /> + <edge from-layer="8386" from-port="3" to-layer="8387" to-port="2" /> + <edge from-layer="8387" from-port="3" to-layer="8388" to-port="1" /> + <edge from-layer="8388" from-port="2" to-layer="8390" to-port="0" /> + <edge from-layer="8389" from-port="0" to-layer="8390" to-port="1" /> + <edge from-layer="8390" from-port="2" to-layer="8445" to-port="1" /> + <edge from-layer="8391" from-port="0" to-layer="8396" to-port="0" /> + <edge from-layer="8392" from-port="0" to-layer="8395" to-port="1" /> + <edge from-layer="8393" from-port="0" to-layer="8395" to-port="2" /> + <edge from-layer="8394" from-port="0" to-layer="8395" to-port="3" /> + <edge from-layer="8395" from-port="4" to-layer="8396" to-port="1" /> + <edge from-layer="8396" from-port="2" to-layer="8397" to-port="0" /> + <edge from-layer="8397" from-port="1" to-layer="8399" to-port="0" /> + <edge from-layer="8398" from-port="0" to-layer="8399" to-port="2" /> + <edge from-layer="8399" from-port="3" to-layer="8418" to-port="0" /> + <edge from-layer="8400" from-port="0" to-layer="8401" to-port="0" /> + <edge from-layer="8401" from-port="1" to-layer="8404" to-port="0" /> + <edge from-layer="8402" from-port="0" to-layer="8403" to-port="0" /> + <edge from-layer="8403" from-port="1" to-layer="8404" to-port="1" /> + <edge from-layer="8404" from-port="2" to-layer="8406" to-port="0" /> + <edge from-layer="8405" from-port="0" to-layer="8406" to-port="1" /> + <edge from-layer="8406" from-port="2" to-layer="8408" to-port="0" /> + <edge from-layer="8407" from-port="0" to-layer="8408" to-port="1" /> + <edge from-layer="8408" from-port="2" to-layer="8409" to-port="0" /> + <edge from-layer="8409" from-port="1" to-layer="8410" to-port="1" /> + <edge from-layer="8410" from-port="2" to-layer="8413" to-port="0" /> + <edge from-layer="8411" from-port="0" to-layer="8412" to-port="0" /> + <edge from-layer="8412" from-port="1" to-layer="8413" to-port="1" /> + <edge from-layer="8413" from-port="2" to-layer="8415" to-port="0" /> + <edge from-layer="8414" from-port="0" to-layer="8415" to-port="1" /> + <edge from-layer="8415" from-port="2" to-layer="8417" to-port="0" /> + <edge from-layer="8416" from-port="0" to-layer="8417" to-port="1" /> + <edge from-layer="8417" from-port="2" to-layer="8418" to-port="1" /> + <edge from-layer="8418" from-port="2" to-layer="11167" to-port="0" /> + <edge from-layer="8418" from-port="2" to-layer="8419" to-port="0" /> + <edge from-layer="8418" from-port="2" to-layer="8420" to-port="0" /> + <edge from-layer="8419" from-port="2" to-layer="8429" to-port="0" /> + <edge from-layer="8420" from-port="1" to-layer="8423" to-port="0" /> + <edge from-layer="8420" from-port="1" to-layer="8427" to-port="0" /> + <edge from-layer="8421" from-port="0" to-layer="8423" to-port="1" /> + <edge from-layer="8422" from-port="0" to-layer="8423" to-port="2" /> + <edge from-layer="8423" from-port="3" to-layer="8428" to-port="1" /> + <edge from-layer="8424" from-port="0" to-layer="8428" to-port="2" /> + <edge from-layer="8425" from-port="0" to-layer="8427" to-port="1" /> + <edge from-layer="8426" from-port="0" to-layer="8427" to-port="2" /> + <edge from-layer="8427" from-port="3" to-layer="8428" to-port="3" /> + <edge from-layer="8428" from-port="4" to-layer="8429" to-port="1" /> + <edge from-layer="8429" from-port="2" to-layer="8431" to-port="0" /> + <edge from-layer="8430" from-port="0" to-layer="8431" to-port="1" /> + <edge from-layer="8431" from-port="2" to-layer="8445" to-port="2" /> + <edge from-layer="8432" from-port="0" to-layer="8444" to-port="1" /> + <edge from-layer="8433" from-port="1" to-layer="8436" to-port="0" /> + <edge from-layer="8434" from-port="0" to-layer="8436" to-port="1" /> + <edge from-layer="8435" from-port="0" to-layer="8436" to-port="2" /> + <edge from-layer="8436" from-port="3" to-layer="8441" to-port="0" /> + <edge from-layer="8437" from-port="1" to-layer="8440" to-port="0" /> + <edge from-layer="8438" from-port="0" to-layer="8440" to-port="1" /> + <edge from-layer="8439" from-port="0" to-layer="8440" to-port="2" /> + <edge from-layer="8440" from-port="3" to-layer="8441" to-port="1" /> + <edge from-layer="8441" from-port="2" to-layer="8444" to-port="2" /> + <edge from-layer="8442" from-port="0" to-layer="8444" to-port="3" /> + <edge from-layer="8443" from-port="0" to-layer="8444" to-port="4" /> + <edge from-layer="8444" from-port="5" to-layer="8445" to-port="3" /> + <edge from-layer="8445" from-port="4" to-layer="8447" to-port="0" /> + <edge from-layer="8446" from-port="0" to-layer="8447" to-port="1" /> + <edge from-layer="8447" from-port="2" to-layer="8449" to-port="0" /> + <edge from-layer="8448" from-port="0" to-layer="8449" to-port="1" /> + <edge from-layer="8449" from-port="2" to-layer="8460" to-port="0" /> + <edge from-layer="8450" from-port="0" to-layer="8451" to-port="0" /> + <edge from-layer="8451" from-port="1" to-layer="8454" to-port="0" /> + <edge from-layer="8452" from-port="0" to-layer="8453" to-port="0" /> + <edge from-layer="8453" from-port="1" to-layer="8454" to-port="1" /> + <edge from-layer="8454" from-port="2" to-layer="8456" to-port="0" /> + <edge from-layer="8455" from-port="0" to-layer="8456" to-port="1" /> + <edge from-layer="8456" from-port="2" to-layer="8458" to-port="0" /> + <edge from-layer="8457" from-port="0" to-layer="8458" to-port="1" /> + <edge from-layer="8458" from-port="2" to-layer="8459" to-port="0" /> + <edge from-layer="8459" from-port="1" to-layer="8460" to-port="1" /> + <edge from-layer="8460" from-port="2" to-layer="8461" to-port="1" /> + <edge from-layer="8461" from-port="2" to-layer="8472" to-port="0" /> + <edge from-layer="8461" from-port="2" to-layer="8509" to-port="0" /> + <edge from-layer="8461" from-port="2" to-layer="8465" to-port="0" /> + <edge from-layer="8462" from-port="0" to-layer="8473" to-port="0" /> + <edge from-layer="8463" from-port="0" to-layer="8471" to-port="0" /> + <edge from-layer="8464" from-port="0" to-layer="8465" to-port="1" /> + <edge from-layer="8465" from-port="2" to-layer="8467" to-port="0" /> + <edge from-layer="8466" from-port="0" to-layer="8467" to-port="1" /> + <edge from-layer="8467" from-port="2" to-layer="8469" to-port="0" /> + <edge from-layer="8468" from-port="0" to-layer="8469" to-port="1" /> + <edge from-layer="8469" from-port="2" to-layer="8470" to-port="0" /> + <edge from-layer="8470" from-port="1" to-layer="8471" to-port="1" /> + <edge from-layer="8471" from-port="2" to-layer="8472" to-port="1" /> + <edge from-layer="8472" from-port="2" to-layer="8473" to-port="1" /> + <edge from-layer="8473" from-port="2" to-layer="8496" to-port="0" /> + <edge from-layer="8473" from-port="2" to-layer="8484" to-port="0" /> + <edge from-layer="8474" from-port="0" to-layer="8475" to-port="0" /> + <edge from-layer="8475" from-port="1" to-layer="8478" to-port="0" /> + <edge from-layer="8476" from-port="0" to-layer="8477" to-port="0" /> + <edge from-layer="8477" from-port="1" to-layer="8478" to-port="1" /> + <edge from-layer="8478" from-port="2" to-layer="8480" to-port="0" /> + <edge from-layer="8479" from-port="0" to-layer="8480" to-port="1" /> + <edge from-layer="8480" from-port="2" to-layer="8482" to-port="0" /> + <edge from-layer="8481" from-port="0" to-layer="8482" to-port="1" /> + <edge from-layer="8482" from-port="2" to-layer="8483" to-port="0" /> + <edge from-layer="8483" from-port="1" to-layer="8484" to-port="1" /> + <edge from-layer="8484" from-port="2" to-layer="8485" to-port="0" /> + <edge from-layer="8485" from-port="1" to-layer="8497" to-port="0" /> + <edge from-layer="8486" from-port="0" to-layer="8487" to-port="0" /> + <edge from-layer="8487" from-port="1" to-layer="8490" to-port="0" /> + <edge from-layer="8488" from-port="0" to-layer="8489" to-port="0" /> + <edge from-layer="8489" from-port="1" to-layer="8490" to-port="1" /> + <edge from-layer="8490" from-port="2" to-layer="8492" to-port="0" /> + <edge from-layer="8491" from-port="0" to-layer="8492" to-port="1" /> + <edge from-layer="8492" from-port="2" to-layer="8494" to-port="0" /> + <edge from-layer="8493" from-port="0" to-layer="8494" to-port="1" /> + <edge from-layer="8494" from-port="2" to-layer="8495" to-port="0" /> + <edge from-layer="8495" from-port="1" to-layer="8496" to-port="1" /> + <edge from-layer="8496" from-port="2" to-layer="8497" to-port="1" /> + <edge from-layer="8497" from-port="2" to-layer="8508" to-port="0" /> + <edge from-layer="8498" from-port="0" to-layer="8499" to-port="0" /> + <edge from-layer="8499" from-port="1" to-layer="8502" to-port="0" /> + <edge from-layer="8500" from-port="0" to-layer="8501" to-port="0" /> + <edge from-layer="8501" from-port="1" to-layer="8502" to-port="1" /> + <edge from-layer="8502" from-port="2" to-layer="8504" to-port="0" /> + <edge from-layer="8503" from-port="0" to-layer="8504" to-port="1" /> + <edge from-layer="8504" from-port="2" to-layer="8506" to-port="0" /> + <edge from-layer="8505" from-port="0" to-layer="8506" to-port="1" /> + <edge from-layer="8506" from-port="2" to-layer="8507" to-port="0" /> + <edge from-layer="8507" from-port="1" to-layer="8508" to-port="1" /> + <edge from-layer="8508" from-port="2" to-layer="8509" to-port="1" /> + <edge from-layer="8509" from-port="2" to-layer="8693" to-port="0" /> + <edge from-layer="8509" from-port="2" to-layer="8513" to-port="0" /> + <edge from-layer="8509" from-port="2" to-layer="8520" to-port="0" /> + <edge from-layer="8510" from-port="0" to-layer="8521" to-port="0" /> + <edge from-layer="8511" from-port="0" to-layer="8519" to-port="0" /> + <edge from-layer="8512" from-port="0" to-layer="8513" to-port="1" /> + <edge from-layer="8513" from-port="2" to-layer="8515" to-port="0" /> + <edge from-layer="8514" from-port="0" to-layer="8515" to-port="1" /> + <edge from-layer="8515" from-port="2" to-layer="8517" to-port="0" /> + <edge from-layer="8516" from-port="0" to-layer="8517" to-port="1" /> + <edge from-layer="8517" from-port="2" to-layer="8518" to-port="0" /> + <edge from-layer="8518" from-port="1" to-layer="8519" to-port="1" /> + <edge from-layer="8519" from-port="2" to-layer="8520" to-port="1" /> + <edge from-layer="8520" from-port="2" to-layer="8521" to-port="1" /> + <edge from-layer="8521" from-port="2" to-layer="8580" to-port="0" /> + <edge from-layer="8521" from-port="2" to-layer="8532" to-port="0" /> + <edge from-layer="8521" from-port="2" to-layer="8642" to-port="0" /> + <edge from-layer="8522" from-port="0" to-layer="8523" to-port="0" /> + <edge from-layer="8523" from-port="1" to-layer="8526" to-port="0" /> + <edge from-layer="8524" from-port="0" to-layer="8525" to-port="0" /> + <edge from-layer="8525" from-port="1" to-layer="8526" to-port="1" /> + <edge from-layer="8526" from-port="2" to-layer="8528" to-port="0" /> + <edge from-layer="8527" from-port="0" to-layer="8528" to-port="1" /> + <edge from-layer="8528" from-port="2" to-layer="8530" to-port="0" /> + <edge from-layer="8529" from-port="0" to-layer="8530" to-port="1" /> + <edge from-layer="8530" from-port="2" to-layer="8531" to-port="0" /> + <edge from-layer="8531" from-port="1" to-layer="8532" to-port="1" /> + <edge from-layer="8532" from-port="2" to-layer="8535" to-port="0" /> + <edge from-layer="8533" from-port="0" to-layer="8534" to-port="0" /> + <edge from-layer="8534" from-port="1" to-layer="8535" to-port="1" /> + <edge from-layer="8535" from-port="2" to-layer="8537" to-port="0" /> + <edge from-layer="8536" from-port="0" to-layer="8537" to-port="1" /> + <edge from-layer="8537" from-port="2" to-layer="8539" to-port="0" /> + <edge from-layer="8538" from-port="0" to-layer="8539" to-port="1" /> + <edge from-layer="8539" from-port="2" to-layer="8540" to-port="0" /> + <edge from-layer="8539" from-port="2" to-layer="8541" to-port="0" /> + <edge from-layer="8539" from-port="2" to-layer="8557" to-port="0" /> + <edge from-layer="8539" from-port="2" to-layer="8551" to-port="0" /> + <edge from-layer="8540" from-port="2" to-layer="8560" to-port="0" /> + <edge from-layer="8541" from-port="1" to-layer="8543" to-port="0" /> + <edge from-layer="8542" from-port="0" to-layer="8543" to-port="2" /> + <edge from-layer="8543" from-port="3" to-layer="8544" to-port="0" /> + <edge from-layer="8544" from-port="2" to-layer="8545" to-port="0" /> + <edge from-layer="8545" from-port="1" to-layer="8547" to-port="0" /> + <edge from-layer="8546" from-port="0" to-layer="8547" to-port="1" /> + <edge from-layer="8547" from-port="2" to-layer="8551" to-port="1" /> + <edge from-layer="8547" from-port="2" to-layer="8557" to-port="2" /> + <edge from-layer="8548" from-port="0" to-layer="8551" to-port="2" /> + <edge from-layer="8549" from-port="0" to-layer="8551" to-port="3" /> + <edge from-layer="8550" from-port="0" to-layer="8551" to-port="4" /> + <edge from-layer="8551" from-port="5" to-layer="8553" to-port="0" /> + <edge from-layer="8552" from-port="0" to-layer="8553" to-port="1" /> + <edge from-layer="8553" from-port="2" to-layer="8558" to-port="0" /> + <edge from-layer="8554" from-port="0" to-layer="8557" to-port="1" /> + <edge from-layer="8555" from-port="0" to-layer="8557" to-port="3" /> + <edge from-layer="8556" from-port="0" to-layer="8557" to-port="4" /> + <edge from-layer="8557" from-port="5" to-layer="8558" to-port="1" /> + <edge from-layer="8558" from-port="2" to-layer="8559" to-port="0" /> + <edge from-layer="8559" from-port="2" to-layer="8560" to-port="1" /> + <edge from-layer="8560" from-port="2" to-layer="8677" to-port="0" /> + <edge from-layer="8561" from-port="0" to-layer="8566" to-port="0" /> + <edge from-layer="8562" from-port="0" to-layer="8565" to-port="1" /> + <edge from-layer="8563" from-port="0" to-layer="8565" to-port="2" /> + <edge from-layer="8564" from-port="0" to-layer="8565" to-port="3" /> + <edge from-layer="8565" from-port="4" to-layer="8566" to-port="1" /> + <edge from-layer="8566" from-port="2" to-layer="8567" to-port="0" /> + <edge from-layer="8567" from-port="1" to-layer="8569" to-port="0" /> + <edge from-layer="8568" from-port="0" to-layer="8569" to-port="2" /> + <edge from-layer="8569" from-port="3" to-layer="8609" to-port="0" /> + <edge from-layer="8569" from-port="3" to-layer="8665" to-port="0" /> + <edge from-layer="8570" from-port="0" to-layer="8571" to-port="0" /> + <edge from-layer="8571" from-port="1" to-layer="8574" to-port="0" /> + <edge from-layer="8572" from-port="0" to-layer="8573" to-port="0" /> + <edge from-layer="8573" from-port="1" to-layer="8574" to-port="1" /> + <edge from-layer="8574" from-port="2" to-layer="8576" to-port="0" /> + <edge from-layer="8575" from-port="0" to-layer="8576" to-port="1" /> + <edge from-layer="8576" from-port="2" to-layer="8578" to-port="0" /> + <edge from-layer="8577" from-port="0" to-layer="8578" to-port="1" /> + <edge from-layer="8578" from-port="2" to-layer="8579" to-port="0" /> + <edge from-layer="8579" from-port="1" to-layer="8580" to-port="1" /> + <edge from-layer="8580" from-port="2" to-layer="8583" to-port="0" /> + <edge from-layer="8581" from-port="0" to-layer="8582" to-port="0" /> + <edge from-layer="8582" from-port="1" to-layer="8583" to-port="1" /> + <edge from-layer="8583" from-port="2" to-layer="8585" to-port="0" /> + <edge from-layer="8584" from-port="0" to-layer="8585" to-port="1" /> + <edge from-layer="8585" from-port="2" to-layer="8587" to-port="0" /> + <edge from-layer="8586" from-port="0" to-layer="8587" to-port="1" /> + <edge from-layer="8587" from-port="2" to-layer="8588" to-port="0" /> + <edge from-layer="8587" from-port="2" to-layer="8589" to-port="0" /> + <edge from-layer="8587" from-port="2" to-layer="8605" to-port="0" /> + <edge from-layer="8587" from-port="2" to-layer="8599" to-port="0" /> + <edge from-layer="8588" from-port="2" to-layer="8608" to-port="0" /> + <edge from-layer="8589" from-port="1" to-layer="8591" to-port="0" /> + <edge from-layer="8590" from-port="0" to-layer="8591" to-port="2" /> + <edge from-layer="8591" from-port="3" to-layer="8592" to-port="0" /> + <edge from-layer="8592" from-port="2" to-layer="8593" to-port="0" /> + <edge from-layer="8593" from-port="1" to-layer="8595" to-port="0" /> + <edge from-layer="8594" from-port="0" to-layer="8595" to-port="1" /> + <edge from-layer="8595" from-port="2" to-layer="8599" to-port="1" /> + <edge from-layer="8595" from-port="2" to-layer="8605" to-port="2" /> + <edge from-layer="8596" from-port="0" to-layer="8599" to-port="2" /> + <edge from-layer="8597" from-port="0" to-layer="8599" to-port="3" /> + <edge from-layer="8598" from-port="0" to-layer="8599" to-port="4" /> + <edge from-layer="8599" from-port="5" to-layer="8601" to-port="0" /> + <edge from-layer="8600" from-port="0" to-layer="8601" to-port="1" /> + <edge from-layer="8601" from-port="2" to-layer="8606" to-port="0" /> + <edge from-layer="8602" from-port="0" to-layer="8605" to-port="1" /> + <edge from-layer="8603" from-port="0" to-layer="8605" to-port="3" /> + <edge from-layer="8604" from-port="0" to-layer="8605" to-port="4" /> + <edge from-layer="8605" from-port="5" to-layer="8606" to-port="1" /> + <edge from-layer="8606" from-port="2" to-layer="8607" to-port="0" /> + <edge from-layer="8607" from-port="2" to-layer="8608" to-port="1" /> + <edge from-layer="8608" from-port="2" to-layer="8669" to-port="0" /> + <edge from-layer="8608" from-port="2" to-layer="8609" to-port="1" /> + <edge from-layer="8609" from-port="2" to-layer="11166" to-port="0" /> + <edge from-layer="8609" from-port="2" to-layer="8611" to-port="0" /> + <edge from-layer="8609" from-port="2" to-layer="8610" to-port="0" /> + <edge from-layer="8610" from-port="2" to-layer="8620" to-port="0" /> + <edge from-layer="8611" from-port="1" to-layer="8614" to-port="0" /> + <edge from-layer="8611" from-port="1" to-layer="8618" to-port="0" /> + <edge from-layer="8612" from-port="0" to-layer="8614" to-port="1" /> + <edge from-layer="8613" from-port="0" to-layer="8614" to-port="2" /> + <edge from-layer="8614" from-port="3" to-layer="8619" to-port="0" /> + <edge from-layer="8615" from-port="0" to-layer="8619" to-port="1" /> + <edge from-layer="8616" from-port="0" to-layer="8618" to-port="1" /> + <edge from-layer="8617" from-port="0" to-layer="8618" to-port="2" /> + <edge from-layer="8618" from-port="3" to-layer="8619" to-port="2" /> + <edge from-layer="8619" from-port="3" to-layer="8620" to-port="1" /> + <edge from-layer="8620" from-port="2" to-layer="8622" to-port="0" /> + <edge from-layer="8621" from-port="0" to-layer="8622" to-port="1" /> + <edge from-layer="8622" from-port="2" to-layer="8677" to-port="1" /> + <edge from-layer="8623" from-port="0" to-layer="8628" to-port="0" /> + <edge from-layer="8624" from-port="0" to-layer="8627" to-port="1" /> + <edge from-layer="8625" from-port="0" to-layer="8627" to-port="2" /> + <edge from-layer="8626" from-port="0" to-layer="8627" to-port="3" /> + <edge from-layer="8627" from-port="4" to-layer="8628" to-port="1" /> + <edge from-layer="8628" from-port="2" to-layer="8629" to-port="0" /> + <edge from-layer="8629" from-port="1" to-layer="8631" to-port="0" /> + <edge from-layer="8630" from-port="0" to-layer="8631" to-port="2" /> + <edge from-layer="8631" from-port="3" to-layer="8650" to-port="0" /> + <edge from-layer="8632" from-port="0" to-layer="8633" to-port="0" /> + <edge from-layer="8633" from-port="1" to-layer="8636" to-port="0" /> + <edge from-layer="8634" from-port="0" to-layer="8635" to-port="0" /> + <edge from-layer="8635" from-port="1" to-layer="8636" to-port="1" /> + <edge from-layer="8636" from-port="2" to-layer="8638" to-port="0" /> + <edge from-layer="8637" from-port="0" to-layer="8638" to-port="1" /> + <edge from-layer="8638" from-port="2" to-layer="8640" to-port="0" /> + <edge from-layer="8639" from-port="0" to-layer="8640" to-port="1" /> + <edge from-layer="8640" from-port="2" to-layer="8641" to-port="0" /> + <edge from-layer="8641" from-port="1" to-layer="8642" to-port="1" /> + <edge from-layer="8642" from-port="2" to-layer="8645" to-port="0" /> + <edge from-layer="8643" from-port="0" to-layer="8644" to-port="0" /> + <edge from-layer="8644" from-port="1" to-layer="8645" to-port="1" /> + <edge from-layer="8645" from-port="2" to-layer="8647" to-port="0" /> + <edge from-layer="8646" from-port="0" to-layer="8647" to-port="1" /> + <edge from-layer="8647" from-port="2" to-layer="8649" to-port="0" /> + <edge from-layer="8648" from-port="0" to-layer="8649" to-port="1" /> + <edge from-layer="8649" from-port="2" to-layer="8650" to-port="1" /> + <edge from-layer="8650" from-port="2" to-layer="8652" to-port="0" /> + <edge from-layer="8650" from-port="2" to-layer="11165" to-port="0" /> + <edge from-layer="8650" from-port="2" to-layer="8651" to-port="0" /> + <edge from-layer="8651" from-port="2" to-layer="8661" to-port="0" /> + <edge from-layer="8652" from-port="1" to-layer="8659" to-port="0" /> + <edge from-layer="8652" from-port="1" to-layer="8655" to-port="0" /> + <edge from-layer="8653" from-port="0" to-layer="8655" to-port="1" /> + <edge from-layer="8654" from-port="0" to-layer="8655" to-port="2" /> + <edge from-layer="8655" from-port="3" to-layer="8660" to-port="1" /> + <edge from-layer="8656" from-port="0" to-layer="8660" to-port="2" /> + <edge from-layer="8657" from-port="0" to-layer="8659" to-port="1" /> + <edge from-layer="8658" from-port="0" to-layer="8659" to-port="2" /> + <edge from-layer="8659" from-port="3" to-layer="8660" to-port="3" /> + <edge from-layer="8660" from-port="4" to-layer="8661" to-port="1" /> + <edge from-layer="8661" from-port="2" to-layer="8663" to-port="0" /> + <edge from-layer="8662" from-port="0" to-layer="8663" to-port="1" /> + <edge from-layer="8663" from-port="2" to-layer="8677" to-port="2" /> + <edge from-layer="8664" from-port="0" to-layer="8676" to-port="1" /> + <edge from-layer="8665" from-port="1" to-layer="8668" to-port="0" /> + <edge from-layer="8666" from-port="0" to-layer="8668" to-port="1" /> + <edge from-layer="8667" from-port="0" to-layer="8668" to-port="2" /> + <edge from-layer="8668" from-port="3" to-layer="8673" to-port="0" /> + <edge from-layer="8669" from-port="1" to-layer="8672" to-port="0" /> + <edge from-layer="8670" from-port="0" to-layer="8672" to-port="1" /> + <edge from-layer="8671" from-port="0" to-layer="8672" to-port="2" /> + <edge from-layer="8672" from-port="3" to-layer="8673" to-port="1" /> + <edge from-layer="8673" from-port="2" to-layer="8676" to-port="2" /> + <edge from-layer="8674" from-port="0" to-layer="8676" to-port="3" /> + <edge from-layer="8675" from-port="0" to-layer="8676" to-port="4" /> + <edge from-layer="8676" from-port="5" to-layer="8677" to-port="3" /> + <edge from-layer="8677" from-port="4" to-layer="8679" to-port="0" /> + <edge from-layer="8678" from-port="0" to-layer="8679" to-port="1" /> + <edge from-layer="8679" from-port="2" to-layer="8681" to-port="0" /> + <edge from-layer="8680" from-port="0" to-layer="8681" to-port="1" /> + <edge from-layer="8681" from-port="2" to-layer="8692" to-port="0" /> + <edge from-layer="8682" from-port="0" to-layer="8683" to-port="0" /> + <edge from-layer="8683" from-port="1" to-layer="8686" to-port="0" /> + <edge from-layer="8684" from-port="0" to-layer="8685" to-port="0" /> + <edge from-layer="8685" from-port="1" to-layer="8686" to-port="1" /> + <edge from-layer="8686" from-port="2" to-layer="8688" to-port="0" /> + <edge from-layer="8687" from-port="0" to-layer="8688" to-port="1" /> + <edge from-layer="8688" from-port="2" to-layer="8690" to-port="0" /> + <edge from-layer="8689" from-port="0" to-layer="8690" to-port="1" /> + <edge from-layer="8690" from-port="2" to-layer="8691" to-port="0" /> + <edge from-layer="8691" from-port="1" to-layer="8692" to-port="1" /> + <edge from-layer="8692" from-port="2" to-layer="8693" to-port="1" /> + <edge from-layer="8693" from-port="2" to-layer="8741" to-port="0" /> + <edge from-layer="8693" from-port="2" to-layer="8704" to-port="0" /> + <edge from-layer="8693" from-port="2" to-layer="8697" to-port="0" /> + <edge from-layer="8694" from-port="0" to-layer="8705" to-port="0" /> + <edge from-layer="8695" from-port="0" to-layer="8703" to-port="0" /> + <edge from-layer="8696" from-port="0" to-layer="8697" to-port="1" /> + <edge from-layer="8697" from-port="2" to-layer="8699" to-port="0" /> + <edge from-layer="8698" from-port="0" to-layer="8699" to-port="1" /> + <edge from-layer="8699" from-port="2" to-layer="8701" to-port="0" /> + <edge from-layer="8700" from-port="0" to-layer="8701" to-port="1" /> + <edge from-layer="8701" from-port="2" to-layer="8702" to-port="0" /> + <edge from-layer="8702" from-port="1" to-layer="8703" to-port="1" /> + <edge from-layer="8703" from-port="2" to-layer="8704" to-port="1" /> + <edge from-layer="8704" from-port="2" to-layer="8705" to-port="1" /> + <edge from-layer="8705" from-port="2" to-layer="8728" to-port="0" /> + <edge from-layer="8705" from-port="2" to-layer="8716" to-port="0" /> + <edge from-layer="8706" from-port="0" to-layer="8707" to-port="0" /> + <edge from-layer="8707" from-port="1" to-layer="8710" to-port="0" /> + <edge from-layer="8708" from-port="0" to-layer="8709" to-port="0" /> + <edge from-layer="8709" from-port="1" to-layer="8710" to-port="1" /> + <edge from-layer="8710" from-port="2" to-layer="8712" to-port="0" /> + <edge from-layer="8711" from-port="0" to-layer="8712" to-port="1" /> + <edge from-layer="8712" from-port="2" to-layer="8714" to-port="0" /> + <edge from-layer="8713" from-port="0" to-layer="8714" to-port="1" /> + <edge from-layer="8714" from-port="2" to-layer="8715" to-port="0" /> + <edge from-layer="8715" from-port="1" to-layer="8716" to-port="1" /> + <edge from-layer="8716" from-port="2" to-layer="8717" to-port="0" /> + <edge from-layer="8717" from-port="1" to-layer="8729" to-port="0" /> + <edge from-layer="8718" from-port="0" to-layer="8719" to-port="0" /> + <edge from-layer="8719" from-port="1" to-layer="8722" to-port="0" /> + <edge from-layer="8720" from-port="0" to-layer="8721" to-port="0" /> + <edge from-layer="8721" from-port="1" to-layer="8722" to-port="1" /> + <edge from-layer="8722" from-port="2" to-layer="8724" to-port="0" /> + <edge from-layer="8723" from-port="0" to-layer="8724" to-port="1" /> + <edge from-layer="8724" from-port="2" to-layer="8726" to-port="0" /> + <edge from-layer="8725" from-port="0" to-layer="8726" to-port="1" /> + <edge from-layer="8726" from-port="2" to-layer="8727" to-port="0" /> + <edge from-layer="8727" from-port="1" to-layer="8728" to-port="1" /> + <edge from-layer="8728" from-port="2" to-layer="8729" to-port="1" /> + <edge from-layer="8729" from-port="2" to-layer="8740" to-port="0" /> + <edge from-layer="8730" from-port="0" to-layer="8731" to-port="0" /> + <edge from-layer="8731" from-port="1" to-layer="8734" to-port="0" /> + <edge from-layer="8732" from-port="0" to-layer="8733" to-port="0" /> + <edge from-layer="8733" from-port="1" to-layer="8734" to-port="1" /> + <edge from-layer="8734" from-port="2" to-layer="8736" to-port="0" /> + <edge from-layer="8735" from-port="0" to-layer="8736" to-port="1" /> + <edge from-layer="8736" from-port="2" to-layer="8738" to-port="0" /> + <edge from-layer="8737" from-port="0" to-layer="8738" to-port="1" /> + <edge from-layer="8738" from-port="2" to-layer="8739" to-port="0" /> + <edge from-layer="8739" from-port="1" to-layer="8740" to-port="1" /> + <edge from-layer="8740" from-port="2" to-layer="8741" to-port="1" /> + <edge from-layer="8741" from-port="2" to-layer="8745" to-port="0" /> + <edge from-layer="8741" from-port="2" to-layer="8752" to-port="0" /> + <edge from-layer="8741" from-port="2" to-layer="8925" to-port="0" /> + <edge from-layer="8742" from-port="0" to-layer="8753" to-port="0" /> + <edge from-layer="8743" from-port="0" to-layer="8751" to-port="0" /> + <edge from-layer="8744" from-port="0" to-layer="8745" to-port="1" /> + <edge from-layer="8745" from-port="2" to-layer="8747" to-port="0" /> + <edge from-layer="8746" from-port="0" to-layer="8747" to-port="1" /> + <edge from-layer="8747" from-port="2" to-layer="8749" to-port="0" /> + <edge from-layer="8748" from-port="0" to-layer="8749" to-port="1" /> + <edge from-layer="8749" from-port="2" to-layer="8750" to-port="0" /> + <edge from-layer="8750" from-port="1" to-layer="8751" to-port="1" /> + <edge from-layer="8751" from-port="2" to-layer="8752" to-port="1" /> + <edge from-layer="8752" from-port="2" to-layer="8753" to-port="1" /> + <edge from-layer="8753" from-port="2" to-layer="8764" to-port="0" /> + <edge from-layer="8753" from-port="2" to-layer="8874" to-port="0" /> + <edge from-layer="8753" from-port="2" to-layer="8812" to-port="0" /> + <edge from-layer="8754" from-port="0" to-layer="8755" to-port="0" /> + <edge from-layer="8755" from-port="1" to-layer="8758" to-port="0" /> + <edge from-layer="8756" from-port="0" to-layer="8757" to-port="0" /> + <edge from-layer="8757" from-port="1" to-layer="8758" to-port="1" /> + <edge from-layer="8758" from-port="2" to-layer="8760" to-port="0" /> + <edge from-layer="8759" from-port="0" to-layer="8760" to-port="1" /> + <edge from-layer="8760" from-port="2" to-layer="8762" to-port="0" /> + <edge from-layer="8761" from-port="0" to-layer="8762" to-port="1" /> + <edge from-layer="8762" from-port="2" to-layer="8763" to-port="0" /> + <edge from-layer="8763" from-port="1" to-layer="8764" to-port="1" /> + <edge from-layer="8764" from-port="2" to-layer="8767" to-port="0" /> + <edge from-layer="8765" from-port="0" to-layer="8766" to-port="0" /> + <edge from-layer="8766" from-port="1" to-layer="8767" to-port="1" /> + <edge from-layer="8767" from-port="2" to-layer="8769" to-port="0" /> + <edge from-layer="8768" from-port="0" to-layer="8769" to-port="1" /> + <edge from-layer="8769" from-port="2" to-layer="8771" to-port="0" /> + <edge from-layer="8770" from-port="0" to-layer="8771" to-port="1" /> + <edge from-layer="8771" from-port="2" to-layer="8783" to-port="0" /> + <edge from-layer="8771" from-port="2" to-layer="8772" to-port="0" /> + <edge from-layer="8771" from-port="2" to-layer="8773" to-port="0" /> + <edge from-layer="8771" from-port="2" to-layer="8789" to-port="0" /> + <edge from-layer="8772" from-port="2" to-layer="8792" to-port="0" /> + <edge from-layer="8773" from-port="1" to-layer="8775" to-port="0" /> + <edge from-layer="8774" from-port="0" to-layer="8775" to-port="2" /> + <edge from-layer="8775" from-port="3" to-layer="8776" to-port="0" /> + <edge from-layer="8776" from-port="2" to-layer="8777" to-port="0" /> + <edge from-layer="8777" from-port="1" to-layer="8779" to-port="0" /> + <edge from-layer="8778" from-port="0" to-layer="8779" to-port="1" /> + <edge from-layer="8779" from-port="2" to-layer="8783" to-port="1" /> + <edge from-layer="8779" from-port="2" to-layer="8789" to-port="2" /> + <edge from-layer="8780" from-port="0" to-layer="8783" to-port="2" /> + <edge from-layer="8781" from-port="0" to-layer="8783" to-port="3" /> + <edge from-layer="8782" from-port="0" to-layer="8783" to-port="4" /> + <edge from-layer="8783" from-port="5" to-layer="8785" to-port="0" /> + <edge from-layer="8784" from-port="0" to-layer="8785" to-port="1" /> + <edge from-layer="8785" from-port="2" to-layer="8790" to-port="0" /> + <edge from-layer="8786" from-port="0" to-layer="8789" to-port="1" /> + <edge from-layer="8787" from-port="0" to-layer="8789" to-port="3" /> + <edge from-layer="8788" from-port="0" to-layer="8789" to-port="4" /> + <edge from-layer="8789" from-port="5" to-layer="8790" to-port="1" /> + <edge from-layer="8790" from-port="2" to-layer="8791" to-port="0" /> + <edge from-layer="8791" from-port="2" to-layer="8792" to-port="1" /> + <edge from-layer="8792" from-port="2" to-layer="8909" to-port="0" /> + <edge from-layer="8793" from-port="0" to-layer="8798" to-port="0" /> + <edge from-layer="8794" from-port="0" to-layer="8797" to-port="1" /> + <edge from-layer="8795" from-port="0" to-layer="8797" to-port="2" /> + <edge from-layer="8796" from-port="0" to-layer="8797" to-port="3" /> + <edge from-layer="8797" from-port="4" to-layer="8798" to-port="1" /> + <edge from-layer="8798" from-port="2" to-layer="8799" to-port="0" /> + <edge from-layer="8799" from-port="1" to-layer="8801" to-port="0" /> + <edge from-layer="8800" from-port="0" to-layer="8801" to-port="2" /> + <edge from-layer="8801" from-port="3" to-layer="8897" to-port="0" /> + <edge from-layer="8801" from-port="3" to-layer="8841" to-port="0" /> + <edge from-layer="8802" from-port="0" to-layer="8803" to-port="0" /> + <edge from-layer="8803" from-port="1" to-layer="8806" to-port="0" /> + <edge from-layer="8804" from-port="0" to-layer="8805" to-port="0" /> + <edge from-layer="8805" from-port="1" to-layer="8806" to-port="1" /> + <edge from-layer="8806" from-port="2" to-layer="8808" to-port="0" /> + <edge from-layer="8807" from-port="0" to-layer="8808" to-port="1" /> + <edge from-layer="8808" from-port="2" to-layer="8810" to-port="0" /> + <edge from-layer="8809" from-port="0" to-layer="8810" to-port="1" /> + <edge from-layer="8810" from-port="2" to-layer="8811" to-port="0" /> + <edge from-layer="8811" from-port="1" to-layer="8812" to-port="1" /> + <edge from-layer="8812" from-port="2" to-layer="8815" to-port="0" /> + <edge from-layer="8813" from-port="0" to-layer="8814" to-port="0" /> + <edge from-layer="8814" from-port="1" to-layer="8815" to-port="1" /> + <edge from-layer="8815" from-port="2" to-layer="8817" to-port="0" /> + <edge from-layer="8816" from-port="0" to-layer="8817" to-port="1" /> + <edge from-layer="8817" from-port="2" to-layer="8819" to-port="0" /> + <edge from-layer="8818" from-port="0" to-layer="8819" to-port="1" /> + <edge from-layer="8819" from-port="2" to-layer="8831" to-port="0" /> + <edge from-layer="8819" from-port="2" to-layer="8837" to-port="0" /> + <edge from-layer="8819" from-port="2" to-layer="8820" to-port="0" /> + <edge from-layer="8819" from-port="2" to-layer="8821" to-port="0" /> + <edge from-layer="8820" from-port="2" to-layer="8840" to-port="0" /> + <edge from-layer="8821" from-port="1" to-layer="8823" to-port="0" /> + <edge from-layer="8822" from-port="0" to-layer="8823" to-port="2" /> + <edge from-layer="8823" from-port="3" to-layer="8824" to-port="0" /> + <edge from-layer="8824" from-port="2" to-layer="8825" to-port="0" /> + <edge from-layer="8825" from-port="1" to-layer="8827" to-port="0" /> + <edge from-layer="8826" from-port="0" to-layer="8827" to-port="1" /> + <edge from-layer="8827" from-port="2" to-layer="8837" to-port="2" /> + <edge from-layer="8827" from-port="2" to-layer="8831" to-port="1" /> + <edge from-layer="8828" from-port="0" to-layer="8831" to-port="2" /> + <edge from-layer="8829" from-port="0" to-layer="8831" to-port="3" /> + <edge from-layer="8830" from-port="0" to-layer="8831" to-port="4" /> + <edge from-layer="8831" from-port="5" to-layer="8833" to-port="0" /> + <edge from-layer="8832" from-port="0" to-layer="8833" to-port="1" /> + <edge from-layer="8833" from-port="2" to-layer="8838" to-port="0" /> + <edge from-layer="8834" from-port="0" to-layer="8837" to-port="1" /> + <edge from-layer="8835" from-port="0" to-layer="8837" to-port="3" /> + <edge from-layer="8836" from-port="0" to-layer="8837" to-port="4" /> + <edge from-layer="8837" from-port="5" to-layer="8838" to-port="1" /> + <edge from-layer="8838" from-port="2" to-layer="8839" to-port="0" /> + <edge from-layer="8839" from-port="2" to-layer="8840" to-port="1" /> + <edge from-layer="8840" from-port="2" to-layer="8901" to-port="0" /> + <edge from-layer="8840" from-port="2" to-layer="8841" to-port="1" /> + <edge from-layer="8841" from-port="2" to-layer="8842" to-port="0" /> + <edge from-layer="8841" from-port="2" to-layer="8843" to-port="0" /> + <edge from-layer="8841" from-port="2" to-layer="11164" to-port="0" /> + <edge from-layer="8842" from-port="2" to-layer="8852" to-port="0" /> + <edge from-layer="8843" from-port="1" to-layer="8850" to-port="0" /> + <edge from-layer="8843" from-port="1" to-layer="8846" to-port="0" /> + <edge from-layer="8844" from-port="0" to-layer="8846" to-port="1" /> + <edge from-layer="8845" from-port="0" to-layer="8846" to-port="2" /> + <edge from-layer="8846" from-port="3" to-layer="8851" to-port="0" /> + <edge from-layer="8847" from-port="0" to-layer="8851" to-port="1" /> + <edge from-layer="8848" from-port="0" to-layer="8850" to-port="1" /> + <edge from-layer="8849" from-port="0" to-layer="8850" to-port="2" /> + <edge from-layer="8850" from-port="3" to-layer="8851" to-port="2" /> + <edge from-layer="8851" from-port="3" to-layer="8852" to-port="1" /> + <edge from-layer="8852" from-port="2" to-layer="8854" to-port="0" /> + <edge from-layer="8853" from-port="0" to-layer="8854" to-port="1" /> + <edge from-layer="8854" from-port="2" to-layer="8909" to-port="1" /> + <edge from-layer="8855" from-port="0" to-layer="8860" to-port="0" /> + <edge from-layer="8856" from-port="0" to-layer="8859" to-port="1" /> + <edge from-layer="8857" from-port="0" to-layer="8859" to-port="2" /> + <edge from-layer="8858" from-port="0" to-layer="8859" to-port="3" /> + <edge from-layer="8859" from-port="4" to-layer="8860" to-port="1" /> + <edge from-layer="8860" from-port="2" to-layer="8861" to-port="0" /> + <edge from-layer="8861" from-port="1" to-layer="8863" to-port="0" /> + <edge from-layer="8862" from-port="0" to-layer="8863" to-port="2" /> + <edge from-layer="8863" from-port="3" to-layer="8882" to-port="0" /> + <edge from-layer="8864" from-port="0" to-layer="8865" to-port="0" /> + <edge from-layer="8865" from-port="1" to-layer="8868" to-port="0" /> + <edge from-layer="8866" from-port="0" to-layer="8867" to-port="0" /> + <edge from-layer="8867" from-port="1" to-layer="8868" to-port="1" /> + <edge from-layer="8868" from-port="2" to-layer="8870" to-port="0" /> + <edge from-layer="8869" from-port="0" to-layer="8870" to-port="1" /> + <edge from-layer="8870" from-port="2" to-layer="8872" to-port="0" /> + <edge from-layer="8871" from-port="0" to-layer="8872" to-port="1" /> + <edge from-layer="8872" from-port="2" to-layer="8873" to-port="0" /> + <edge from-layer="8873" from-port="1" to-layer="8874" to-port="1" /> + <edge from-layer="8874" from-port="2" to-layer="8877" to-port="0" /> + <edge from-layer="8875" from-port="0" to-layer="8876" to-port="0" /> + <edge from-layer="8876" from-port="1" to-layer="8877" to-port="1" /> + <edge from-layer="8877" from-port="2" to-layer="8879" to-port="0" /> + <edge from-layer="8878" from-port="0" to-layer="8879" to-port="1" /> + <edge from-layer="8879" from-port="2" to-layer="8881" to-port="0" /> + <edge from-layer="8880" from-port="0" to-layer="8881" to-port="1" /> + <edge from-layer="8881" from-port="2" to-layer="8882" to-port="1" /> + <edge from-layer="8882" from-port="2" to-layer="8883" to-port="0" /> + <edge from-layer="8882" from-port="2" to-layer="11163" to-port="0" /> + <edge from-layer="8882" from-port="2" to-layer="8884" to-port="0" /> + <edge from-layer="8883" from-port="2" to-layer="8893" to-port="0" /> + <edge from-layer="8884" from-port="1" to-layer="8891" to-port="0" /> + <edge from-layer="8884" from-port="1" to-layer="8887" to-port="0" /> + <edge from-layer="8885" from-port="0" to-layer="8887" to-port="1" /> + <edge from-layer="8886" from-port="0" to-layer="8887" to-port="2" /> + <edge from-layer="8887" from-port="3" to-layer="8892" to-port="1" /> + <edge from-layer="8888" from-port="0" to-layer="8892" to-port="2" /> + <edge from-layer="8889" from-port="0" to-layer="8891" to-port="1" /> + <edge from-layer="8890" from-port="0" to-layer="8891" to-port="2" /> + <edge from-layer="8891" from-port="3" to-layer="8892" to-port="3" /> + <edge from-layer="8892" from-port="4" to-layer="8893" to-port="1" /> + <edge from-layer="8893" from-port="2" to-layer="8895" to-port="0" /> + <edge from-layer="8894" from-port="0" to-layer="8895" to-port="1" /> + <edge from-layer="8895" from-port="2" to-layer="8909" to-port="2" /> + <edge from-layer="8896" from-port="0" to-layer="8908" to-port="1" /> + <edge from-layer="8897" from-port="1" to-layer="8900" to-port="0" /> + <edge from-layer="8898" from-port="0" to-layer="8900" to-port="1" /> + <edge from-layer="8899" from-port="0" to-layer="8900" to-port="2" /> + <edge from-layer="8900" from-port="3" to-layer="8905" to-port="0" /> + <edge from-layer="8901" from-port="1" to-layer="8904" to-port="0" /> + <edge from-layer="8902" from-port="0" to-layer="8904" to-port="1" /> + <edge from-layer="8903" from-port="0" to-layer="8904" to-port="2" /> + <edge from-layer="8904" from-port="3" to-layer="8905" to-port="1" /> + <edge from-layer="8905" from-port="2" to-layer="8908" to-port="2" /> + <edge from-layer="8906" from-port="0" to-layer="8908" to-port="3" /> + <edge from-layer="8907" from-port="0" to-layer="8908" to-port="4" /> + <edge from-layer="8908" from-port="5" to-layer="8909" to-port="3" /> + <edge from-layer="8909" from-port="4" to-layer="8911" to-port="0" /> + <edge from-layer="8910" from-port="0" to-layer="8911" to-port="1" /> + <edge from-layer="8911" from-port="2" to-layer="8913" to-port="0" /> + <edge from-layer="8912" from-port="0" to-layer="8913" to-port="1" /> + <edge from-layer="8913" from-port="2" to-layer="8924" to-port="0" /> + <edge from-layer="8914" from-port="0" to-layer="8915" to-port="0" /> + <edge from-layer="8915" from-port="1" to-layer="8918" to-port="0" /> + <edge from-layer="8916" from-port="0" to-layer="8917" to-port="0" /> + <edge from-layer="8917" from-port="1" to-layer="8918" to-port="1" /> + <edge from-layer="8918" from-port="2" to-layer="8920" to-port="0" /> + <edge from-layer="8919" from-port="0" to-layer="8920" to-port="1" /> + <edge from-layer="8920" from-port="2" to-layer="8922" to-port="0" /> + <edge from-layer="8921" from-port="0" to-layer="8922" to-port="1" /> + <edge from-layer="8922" from-port="2" to-layer="8923" to-port="0" /> + <edge from-layer="8923" from-port="1" to-layer="8924" to-port="1" /> + <edge from-layer="8924" from-port="2" to-layer="8925" to-port="1" /> + <edge from-layer="8925" from-port="2" to-layer="8929" to-port="0" /> + <edge from-layer="8925" from-port="2" to-layer="8973" to-port="0" /> + <edge from-layer="8925" from-port="2" to-layer="8936" to-port="0" /> + <edge from-layer="8926" from-port="0" to-layer="8937" to-port="0" /> + <edge from-layer="8927" from-port="0" to-layer="8935" to-port="0" /> + <edge from-layer="8928" from-port="0" to-layer="8929" to-port="1" /> + <edge from-layer="8929" from-port="2" to-layer="8931" to-port="0" /> + <edge from-layer="8930" from-port="0" to-layer="8931" to-port="1" /> + <edge from-layer="8931" from-port="2" to-layer="8933" to-port="0" /> + <edge from-layer="8932" from-port="0" to-layer="8933" to-port="1" /> + <edge from-layer="8933" from-port="2" to-layer="8934" to-port="0" /> + <edge from-layer="8934" from-port="1" to-layer="8935" to-port="1" /> + <edge from-layer="8935" from-port="2" to-layer="8936" to-port="1" /> + <edge from-layer="8936" from-port="2" to-layer="8937" to-port="1" /> + <edge from-layer="8937" from-port="2" to-layer="8960" to-port="0" /> + <edge from-layer="8937" from-port="2" to-layer="8948" to-port="0" /> + <edge from-layer="8938" from-port="0" to-layer="8939" to-port="0" /> + <edge from-layer="8939" from-port="1" to-layer="8942" to-port="0" /> + <edge from-layer="8940" from-port="0" to-layer="8941" to-port="0" /> + <edge from-layer="8941" from-port="1" to-layer="8942" to-port="1" /> + <edge from-layer="8942" from-port="2" to-layer="8944" to-port="0" /> + <edge from-layer="8943" from-port="0" to-layer="8944" to-port="1" /> + <edge from-layer="8944" from-port="2" to-layer="8946" to-port="0" /> + <edge from-layer="8945" from-port="0" to-layer="8946" to-port="1" /> + <edge from-layer="8946" from-port="2" to-layer="8947" to-port="0" /> + <edge from-layer="8947" from-port="1" to-layer="8948" to-port="1" /> + <edge from-layer="8948" from-port="2" to-layer="8949" to-port="0" /> + <edge from-layer="8949" from-port="1" to-layer="8961" to-port="0" /> + <edge from-layer="8950" from-port="0" to-layer="8951" to-port="0" /> + <edge from-layer="8951" from-port="1" to-layer="8954" to-port="0" /> + <edge from-layer="8952" from-port="0" to-layer="8953" to-port="0" /> + <edge from-layer="8953" from-port="1" to-layer="8954" to-port="1" /> + <edge from-layer="8954" from-port="2" to-layer="8956" to-port="0" /> + <edge from-layer="8955" from-port="0" to-layer="8956" to-port="1" /> + <edge from-layer="8956" from-port="2" to-layer="8958" to-port="0" /> + <edge from-layer="8957" from-port="0" to-layer="8958" to-port="1" /> + <edge from-layer="8958" from-port="2" to-layer="8959" to-port="0" /> + <edge from-layer="8959" from-port="1" to-layer="8960" to-port="1" /> + <edge from-layer="8960" from-port="2" to-layer="8961" to-port="1" /> + <edge from-layer="8961" from-port="2" to-layer="8972" to-port="0" /> + <edge from-layer="8962" from-port="0" to-layer="8963" to-port="0" /> + <edge from-layer="8963" from-port="1" to-layer="8966" to-port="0" /> + <edge from-layer="8964" from-port="0" to-layer="8965" to-port="0" /> + <edge from-layer="8965" from-port="1" to-layer="8966" to-port="1" /> + <edge from-layer="8966" from-port="2" to-layer="8968" to-port="0" /> + <edge from-layer="8967" from-port="0" to-layer="8968" to-port="1" /> + <edge from-layer="8968" from-port="2" to-layer="8970" to-port="0" /> + <edge from-layer="8969" from-port="0" to-layer="8970" to-port="1" /> + <edge from-layer="8970" from-port="2" to-layer="8971" to-port="0" /> + <edge from-layer="8971" from-port="1" to-layer="8972" to-port="1" /> + <edge from-layer="8972" from-port="2" to-layer="8973" to-port="1" /> + <edge from-layer="8973" from-port="2" to-layer="8977" to-port="0" /> + <edge from-layer="8973" from-port="2" to-layer="8984" to-port="0" /> + <edge from-layer="8973" from-port="2" to-layer="9157" to-port="0" /> + <edge from-layer="8974" from-port="0" to-layer="8985" to-port="0" /> + <edge from-layer="8975" from-port="0" to-layer="8983" to-port="0" /> + <edge from-layer="8976" from-port="0" to-layer="8977" to-port="1" /> + <edge from-layer="8977" from-port="2" to-layer="8979" to-port="0" /> + <edge from-layer="8978" from-port="0" to-layer="8979" to-port="1" /> + <edge from-layer="8979" from-port="2" to-layer="8981" to-port="0" /> + <edge from-layer="8980" from-port="0" to-layer="8981" to-port="1" /> + <edge from-layer="8981" from-port="2" to-layer="8982" to-port="0" /> + <edge from-layer="8982" from-port="1" to-layer="8983" to-port="1" /> + <edge from-layer="8983" from-port="2" to-layer="8984" to-port="1" /> + <edge from-layer="8984" from-port="2" to-layer="8985" to-port="1" /> + <edge from-layer="8985" from-port="2" to-layer="9044" to-port="0" /> + <edge from-layer="8985" from-port="2" to-layer="9106" to-port="0" /> + <edge from-layer="8985" from-port="2" to-layer="8996" to-port="0" /> + <edge from-layer="8986" from-port="0" to-layer="8987" to-port="0" /> + <edge from-layer="8987" from-port="1" to-layer="8990" to-port="0" /> + <edge from-layer="8988" from-port="0" to-layer="8989" to-port="0" /> + <edge from-layer="8989" from-port="1" to-layer="8990" to-port="1" /> + <edge from-layer="8990" from-port="2" to-layer="8992" to-port="0" /> + <edge from-layer="8991" from-port="0" to-layer="8992" to-port="1" /> + <edge from-layer="8992" from-port="2" to-layer="8994" to-port="0" /> + <edge from-layer="8993" from-port="0" to-layer="8994" to-port="1" /> + <edge from-layer="8994" from-port="2" to-layer="8995" to-port="0" /> + <edge from-layer="8995" from-port="1" to-layer="8996" to-port="1" /> + <edge from-layer="8996" from-port="2" to-layer="8999" to-port="0" /> + <edge from-layer="8997" from-port="0" to-layer="8998" to-port="0" /> + <edge from-layer="8998" from-port="1" to-layer="8999" to-port="1" /> + <edge from-layer="8999" from-port="2" to-layer="9001" to-port="0" /> + <edge from-layer="9000" from-port="0" to-layer="9001" to-port="1" /> + <edge from-layer="9001" from-port="2" to-layer="9003" to-port="0" /> + <edge from-layer="9002" from-port="0" to-layer="9003" to-port="1" /> + <edge from-layer="9003" from-port="2" to-layer="9005" to-port="0" /> + <edge from-layer="9003" from-port="2" to-layer="9021" to-port="0" /> + <edge from-layer="9003" from-port="2" to-layer="9015" to-port="0" /> + <edge from-layer="9003" from-port="2" to-layer="9004" to-port="0" /> + <edge from-layer="9004" from-port="2" to-layer="9024" to-port="0" /> + <edge from-layer="9005" from-port="1" to-layer="9007" to-port="0" /> + <edge from-layer="9006" from-port="0" to-layer="9007" to-port="2" /> + <edge from-layer="9007" from-port="3" to-layer="9008" to-port="0" /> + <edge from-layer="9008" from-port="2" to-layer="9009" to-port="0" /> + <edge from-layer="9009" from-port="1" to-layer="9011" to-port="0" /> + <edge from-layer="9010" from-port="0" to-layer="9011" to-port="1" /> + <edge from-layer="9011" from-port="2" to-layer="9021" to-port="2" /> + <edge from-layer="9011" from-port="2" to-layer="9015" to-port="1" /> + <edge from-layer="9012" from-port="0" to-layer="9015" to-port="2" /> + <edge from-layer="9013" from-port="0" to-layer="9015" to-port="3" /> + <edge from-layer="9014" from-port="0" to-layer="9015" to-port="4" /> + <edge from-layer="9015" from-port="5" to-layer="9017" to-port="0" /> + <edge from-layer="9016" from-port="0" to-layer="9017" to-port="1" /> + <edge from-layer="9017" from-port="2" to-layer="9022" to-port="0" /> + <edge from-layer="9018" from-port="0" to-layer="9021" to-port="1" /> + <edge from-layer="9019" from-port="0" to-layer="9021" to-port="3" /> + <edge from-layer="9020" from-port="0" to-layer="9021" to-port="4" /> + <edge from-layer="9021" from-port="5" to-layer="9022" to-port="1" /> + <edge from-layer="9022" from-port="2" to-layer="9023" to-port="0" /> + <edge from-layer="9023" from-port="2" to-layer="9024" to-port="1" /> + <edge from-layer="9024" from-port="2" to-layer="9141" to-port="0" /> + <edge from-layer="9025" from-port="0" to-layer="9030" to-port="0" /> + <edge from-layer="9026" from-port="0" to-layer="9029" to-port="1" /> + <edge from-layer="9027" from-port="0" to-layer="9029" to-port="2" /> + <edge from-layer="9028" from-port="0" to-layer="9029" to-port="3" /> + <edge from-layer="9029" from-port="4" to-layer="9030" to-port="1" /> + <edge from-layer="9030" from-port="2" to-layer="9031" to-port="0" /> + <edge from-layer="9031" from-port="1" to-layer="9033" to-port="0" /> + <edge from-layer="9032" from-port="0" to-layer="9033" to-port="2" /> + <edge from-layer="9033" from-port="3" to-layer="9073" to-port="0" /> + <edge from-layer="9033" from-port="3" to-layer="9129" to-port="0" /> + <edge from-layer="9034" from-port="0" to-layer="9035" to-port="0" /> + <edge from-layer="9035" from-port="1" to-layer="9038" to-port="0" /> + <edge from-layer="9036" from-port="0" to-layer="9037" to-port="0" /> + <edge from-layer="9037" from-port="1" to-layer="9038" to-port="1" /> + <edge from-layer="9038" from-port="2" to-layer="9040" to-port="0" /> + <edge from-layer="9039" from-port="0" to-layer="9040" to-port="1" /> + <edge from-layer="9040" from-port="2" to-layer="9042" to-port="0" /> + <edge from-layer="9041" from-port="0" to-layer="9042" to-port="1" /> + <edge from-layer="9042" from-port="2" to-layer="9043" to-port="0" /> + <edge from-layer="9043" from-port="1" to-layer="9044" to-port="1" /> + <edge from-layer="9044" from-port="2" to-layer="9047" to-port="0" /> + <edge from-layer="9045" from-port="0" to-layer="9046" to-port="0" /> + <edge from-layer="9046" from-port="1" to-layer="9047" to-port="1" /> + <edge from-layer="9047" from-port="2" to-layer="9049" to-port="0" /> + <edge from-layer="9048" from-port="0" to-layer="9049" to-port="1" /> + <edge from-layer="9049" from-port="2" to-layer="9051" to-port="0" /> + <edge from-layer="9050" from-port="0" to-layer="9051" to-port="1" /> + <edge from-layer="9051" from-port="2" to-layer="9052" to-port="0" /> + <edge from-layer="9051" from-port="2" to-layer="9053" to-port="0" /> + <edge from-layer="9051" from-port="2" to-layer="9069" to-port="0" /> + <edge from-layer="9051" from-port="2" to-layer="9063" to-port="0" /> + <edge from-layer="9052" from-port="2" to-layer="9072" to-port="0" /> + <edge from-layer="9053" from-port="1" to-layer="9055" to-port="0" /> + <edge from-layer="9054" from-port="0" to-layer="9055" to-port="2" /> + <edge from-layer="9055" from-port="3" to-layer="9056" to-port="0" /> + <edge from-layer="9056" from-port="2" to-layer="9057" to-port="0" /> + <edge from-layer="9057" from-port="1" to-layer="9059" to-port="0" /> + <edge from-layer="9058" from-port="0" to-layer="9059" to-port="1" /> + <edge from-layer="9059" from-port="2" to-layer="9063" to-port="1" /> + <edge from-layer="9059" from-port="2" to-layer="9069" to-port="2" /> + <edge from-layer="9060" from-port="0" to-layer="9063" to-port="2" /> + <edge from-layer="9061" from-port="0" to-layer="9063" to-port="3" /> + <edge from-layer="9062" from-port="0" to-layer="9063" to-port="4" /> + <edge from-layer="9063" from-port="5" to-layer="9065" to-port="0" /> + <edge from-layer="9064" from-port="0" to-layer="9065" to-port="1" /> + <edge from-layer="9065" from-port="2" to-layer="9070" to-port="0" /> + <edge from-layer="9066" from-port="0" to-layer="9069" to-port="1" /> + <edge from-layer="9067" from-port="0" to-layer="9069" to-port="3" /> + <edge from-layer="9068" from-port="0" to-layer="9069" to-port="4" /> + <edge from-layer="9069" from-port="5" to-layer="9070" to-port="1" /> + <edge from-layer="9070" from-port="2" to-layer="9071" to-port="0" /> + <edge from-layer="9071" from-port="2" to-layer="9072" to-port="1" /> + <edge from-layer="9072" from-port="2" to-layer="9133" to-port="0" /> + <edge from-layer="9072" from-port="2" to-layer="9073" to-port="1" /> + <edge from-layer="9073" from-port="2" to-layer="11162" to-port="0" /> + <edge from-layer="9073" from-port="2" to-layer="9075" to-port="0" /> + <edge from-layer="9073" from-port="2" to-layer="9074" to-port="0" /> + <edge from-layer="9074" from-port="2" to-layer="9084" to-port="0" /> + <edge from-layer="9075" from-port="1" to-layer="9078" to-port="0" /> + <edge from-layer="9075" from-port="1" to-layer="9082" to-port="0" /> + <edge from-layer="9076" from-port="0" to-layer="9078" to-port="1" /> + <edge from-layer="9077" from-port="0" to-layer="9078" to-port="2" /> + <edge from-layer="9078" from-port="3" to-layer="9083" to-port="0" /> + <edge from-layer="9079" from-port="0" to-layer="9083" to-port="1" /> + <edge from-layer="9080" from-port="0" to-layer="9082" to-port="1" /> + <edge from-layer="9081" from-port="0" to-layer="9082" to-port="2" /> + <edge from-layer="9082" from-port="3" to-layer="9083" to-port="2" /> + <edge from-layer="9083" from-port="3" to-layer="9084" to-port="1" /> + <edge from-layer="9084" from-port="2" to-layer="9086" to-port="0" /> + <edge from-layer="9085" from-port="0" to-layer="9086" to-port="1" /> + <edge from-layer="9086" from-port="2" to-layer="9141" to-port="1" /> + <edge from-layer="9087" from-port="0" to-layer="9092" to-port="0" /> + <edge from-layer="9088" from-port="0" to-layer="9091" to-port="1" /> + <edge from-layer="9089" from-port="0" to-layer="9091" to-port="2" /> + <edge from-layer="9090" from-port="0" to-layer="9091" to-port="3" /> + <edge from-layer="9091" from-port="4" to-layer="9092" to-port="1" /> + <edge from-layer="9092" from-port="2" to-layer="9093" to-port="0" /> + <edge from-layer="9093" from-port="1" to-layer="9095" to-port="0" /> + <edge from-layer="9094" from-port="0" to-layer="9095" to-port="2" /> + <edge from-layer="9095" from-port="3" to-layer="9114" to-port="0" /> + <edge from-layer="9096" from-port="0" to-layer="9097" to-port="0" /> + <edge from-layer="9097" from-port="1" to-layer="9100" to-port="0" /> + <edge from-layer="9098" from-port="0" to-layer="9099" to-port="0" /> + <edge from-layer="9099" from-port="1" to-layer="9100" to-port="1" /> + <edge from-layer="9100" from-port="2" to-layer="9102" to-port="0" /> + <edge from-layer="9101" from-port="0" to-layer="9102" to-port="1" /> + <edge from-layer="9102" from-port="2" to-layer="9104" to-port="0" /> + <edge from-layer="9103" from-port="0" to-layer="9104" to-port="1" /> + <edge from-layer="9104" from-port="2" to-layer="9105" to-port="0" /> + <edge from-layer="9105" from-port="1" to-layer="9106" to-port="1" /> + <edge from-layer="9106" from-port="2" to-layer="9109" to-port="0" /> + <edge from-layer="9107" from-port="0" to-layer="9108" to-port="0" /> + <edge from-layer="9108" from-port="1" to-layer="9109" to-port="1" /> + <edge from-layer="9109" from-port="2" to-layer="9111" to-port="0" /> + <edge from-layer="9110" from-port="0" to-layer="9111" to-port="1" /> + <edge from-layer="9111" from-port="2" to-layer="9113" to-port="0" /> + <edge from-layer="9112" from-port="0" to-layer="9113" to-port="1" /> + <edge from-layer="9113" from-port="2" to-layer="9114" to-port="1" /> + <edge from-layer="9114" from-port="2" to-layer="9115" to-port="0" /> + <edge from-layer="9114" from-port="2" to-layer="9116" to-port="0" /> + <edge from-layer="9114" from-port="2" to-layer="11161" to-port="0" /> + <edge from-layer="9115" from-port="2" to-layer="9125" to-port="0" /> + <edge from-layer="9116" from-port="1" to-layer="9119" to-port="0" /> + <edge from-layer="9116" from-port="1" to-layer="9123" to-port="0" /> + <edge from-layer="9117" from-port="0" to-layer="9119" to-port="1" /> + <edge from-layer="9118" from-port="0" to-layer="9119" to-port="2" /> + <edge from-layer="9119" from-port="3" to-layer="9124" to-port="1" /> + <edge from-layer="9120" from-port="0" to-layer="9124" to-port="2" /> + <edge from-layer="9121" from-port="0" to-layer="9123" to-port="1" /> + <edge from-layer="9122" from-port="0" to-layer="9123" to-port="2" /> + <edge from-layer="9123" from-port="3" to-layer="9124" to-port="3" /> + <edge from-layer="9124" from-port="4" to-layer="9125" to-port="1" /> + <edge from-layer="9125" from-port="2" to-layer="9127" to-port="0" /> + <edge from-layer="9126" from-port="0" to-layer="9127" to-port="1" /> + <edge from-layer="9127" from-port="2" to-layer="9141" to-port="2" /> + <edge from-layer="9128" from-port="0" to-layer="9140" to-port="1" /> + <edge from-layer="9129" from-port="1" to-layer="9132" to-port="0" /> + <edge from-layer="9130" from-port="0" to-layer="9132" to-port="1" /> + <edge from-layer="9131" from-port="0" to-layer="9132" to-port="2" /> + <edge from-layer="9132" from-port="3" to-layer="9137" to-port="0" /> + <edge from-layer="9133" from-port="1" to-layer="9136" to-port="0" /> + <edge from-layer="9134" from-port="0" to-layer="9136" to-port="1" /> + <edge from-layer="9135" from-port="0" to-layer="9136" to-port="2" /> + <edge from-layer="9136" from-port="3" to-layer="9137" to-port="1" /> + <edge from-layer="9137" from-port="2" to-layer="9140" to-port="2" /> + <edge from-layer="9138" from-port="0" to-layer="9140" to-port="3" /> + <edge from-layer="9139" from-port="0" to-layer="9140" to-port="4" /> + <edge from-layer="9140" from-port="5" to-layer="9141" to-port="3" /> + <edge from-layer="9141" from-port="4" to-layer="9143" to-port="0" /> + <edge from-layer="9142" from-port="0" to-layer="9143" to-port="1" /> + <edge from-layer="9143" from-port="2" to-layer="9145" to-port="0" /> + <edge from-layer="9144" from-port="0" to-layer="9145" to-port="1" /> + <edge from-layer="9145" from-port="2" to-layer="9156" to-port="0" /> + <edge from-layer="9146" from-port="0" to-layer="9147" to-port="0" /> + <edge from-layer="9147" from-port="1" to-layer="9150" to-port="0" /> + <edge from-layer="9148" from-port="0" to-layer="9149" to-port="0" /> + <edge from-layer="9149" from-port="1" to-layer="9150" to-port="1" /> + <edge from-layer="9150" from-port="2" to-layer="9152" to-port="0" /> + <edge from-layer="9151" from-port="0" to-layer="9152" to-port="1" /> + <edge from-layer="9152" from-port="2" to-layer="9154" to-port="0" /> + <edge from-layer="9153" from-port="0" to-layer="9154" to-port="1" /> + <edge from-layer="9154" from-port="2" to-layer="9155" to-port="0" /> + <edge from-layer="9155" from-port="1" to-layer="9156" to-port="1" /> + <edge from-layer="9156" from-port="2" to-layer="9157" to-port="1" /> + <edge from-layer="9157" from-port="2" to-layer="9205" to-port="0" /> + <edge from-layer="9157" from-port="2" to-layer="9168" to-port="0" /> + <edge from-layer="9157" from-port="2" to-layer="9161" to-port="0" /> + <edge from-layer="9158" from-port="0" to-layer="9169" to-port="0" /> + <edge from-layer="9159" from-port="0" to-layer="9167" to-port="0" /> + <edge from-layer="9160" from-port="0" to-layer="9161" to-port="1" /> + <edge from-layer="9161" from-port="2" to-layer="9163" to-port="0" /> + <edge from-layer="9162" from-port="0" to-layer="9163" to-port="1" /> + <edge from-layer="9163" from-port="2" to-layer="9165" to-port="0" /> + <edge from-layer="9164" from-port="0" to-layer="9165" to-port="1" /> + <edge from-layer="9165" from-port="2" to-layer="9166" to-port="0" /> + <edge from-layer="9166" from-port="1" to-layer="9167" to-port="1" /> + <edge from-layer="9167" from-port="2" to-layer="9168" to-port="1" /> + <edge from-layer="9168" from-port="2" to-layer="9169" to-port="1" /> + <edge from-layer="9169" from-port="2" to-layer="9192" to-port="0" /> + <edge from-layer="9169" from-port="2" to-layer="9180" to-port="0" /> + <edge from-layer="9170" from-port="0" to-layer="9171" to-port="0" /> + <edge from-layer="9171" from-port="1" to-layer="9174" to-port="0" /> + <edge from-layer="9172" from-port="0" to-layer="9173" to-port="0" /> + <edge from-layer="9173" from-port="1" to-layer="9174" to-port="1" /> + <edge from-layer="9174" from-port="2" to-layer="9176" to-port="0" /> + <edge from-layer="9175" from-port="0" to-layer="9176" to-port="1" /> + <edge from-layer="9176" from-port="2" to-layer="9178" to-port="0" /> + <edge from-layer="9177" from-port="0" to-layer="9178" to-port="1" /> + <edge from-layer="9178" from-port="2" to-layer="9179" to-port="0" /> + <edge from-layer="9179" from-port="1" to-layer="9180" to-port="1" /> + <edge from-layer="9180" from-port="2" to-layer="9181" to-port="0" /> + <edge from-layer="9181" from-port="1" to-layer="9193" to-port="0" /> + <edge from-layer="9182" from-port="0" to-layer="9183" to-port="0" /> + <edge from-layer="9183" from-port="1" to-layer="9186" to-port="0" /> + <edge from-layer="9184" from-port="0" to-layer="9185" to-port="0" /> + <edge from-layer="9185" from-port="1" to-layer="9186" to-port="1" /> + <edge from-layer="9186" from-port="2" to-layer="9188" to-port="0" /> + <edge from-layer="9187" from-port="0" to-layer="9188" to-port="1" /> + <edge from-layer="9188" from-port="2" to-layer="9190" to-port="0" /> + <edge from-layer="9189" from-port="0" to-layer="9190" to-port="1" /> + <edge from-layer="9190" from-port="2" to-layer="9191" to-port="0" /> + <edge from-layer="9191" from-port="1" to-layer="9192" to-port="1" /> + <edge from-layer="9192" from-port="2" to-layer="9193" to-port="1" /> + <edge from-layer="9193" from-port="2" to-layer="9204" to-port="0" /> + <edge from-layer="9194" from-port="0" to-layer="9195" to-port="0" /> + <edge from-layer="9195" from-port="1" to-layer="9198" to-port="0" /> + <edge from-layer="9196" from-port="0" to-layer="9197" to-port="0" /> + <edge from-layer="9197" from-port="1" to-layer="9198" to-port="1" /> + <edge from-layer="9198" from-port="2" to-layer="9200" to-port="0" /> + <edge from-layer="9199" from-port="0" to-layer="9200" to-port="1" /> + <edge from-layer="9200" from-port="2" to-layer="9202" to-port="0" /> + <edge from-layer="9201" from-port="0" to-layer="9202" to-port="1" /> + <edge from-layer="9202" from-port="2" to-layer="9203" to-port="0" /> + <edge from-layer="9203" from-port="1" to-layer="9204" to-port="1" /> + <edge from-layer="9204" from-port="2" to-layer="9205" to-port="1" /> + <edge from-layer="9205" from-port="2" to-layer="9389" to-port="0" /> + <edge from-layer="9205" from-port="2" to-layer="9216" to-port="0" /> + <edge from-layer="9205" from-port="2" to-layer="9209" to-port="0" /> + <edge from-layer="9206" from-port="0" to-layer="9217" to-port="0" /> + <edge from-layer="9207" from-port="0" to-layer="9215" to-port="0" /> + <edge from-layer="9208" from-port="0" to-layer="9209" to-port="1" /> + <edge from-layer="9209" from-port="2" to-layer="9211" to-port="0" /> + <edge from-layer="9210" from-port="0" to-layer="9211" to-port="1" /> + <edge from-layer="9211" from-port="2" to-layer="9213" to-port="0" /> + <edge from-layer="9212" from-port="0" to-layer="9213" to-port="1" /> + <edge from-layer="9213" from-port="2" to-layer="9214" to-port="0" /> + <edge from-layer="9214" from-port="1" to-layer="9215" to-port="1" /> + <edge from-layer="9215" from-port="2" to-layer="9216" to-port="1" /> + <edge from-layer="9216" from-port="2" to-layer="9217" to-port="1" /> + <edge from-layer="9217" from-port="2" to-layer="9276" to-port="0" /> + <edge from-layer="9217" from-port="2" to-layer="9338" to-port="0" /> + <edge from-layer="9217" from-port="2" to-layer="9228" to-port="0" /> + <edge from-layer="9218" from-port="0" to-layer="9219" to-port="0" /> + <edge from-layer="9219" from-port="1" to-layer="9222" to-port="0" /> + <edge from-layer="9220" from-port="0" to-layer="9221" to-port="0" /> + <edge from-layer="9221" from-port="1" to-layer="9222" to-port="1" /> + <edge from-layer="9222" from-port="2" to-layer="9224" to-port="0" /> + <edge from-layer="9223" from-port="0" to-layer="9224" to-port="1" /> + <edge from-layer="9224" from-port="2" to-layer="9226" to-port="0" /> + <edge from-layer="9225" from-port="0" to-layer="9226" to-port="1" /> + <edge from-layer="9226" from-port="2" to-layer="9227" to-port="0" /> + <edge from-layer="9227" from-port="1" to-layer="9228" to-port="1" /> + <edge from-layer="9228" from-port="2" to-layer="9231" to-port="0" /> + <edge from-layer="9229" from-port="0" to-layer="9230" to-port="0" /> + <edge from-layer="9230" from-port="1" to-layer="9231" to-port="1" /> + <edge from-layer="9231" from-port="2" to-layer="9233" to-port="0" /> + <edge from-layer="9232" from-port="0" to-layer="9233" to-port="1" /> + <edge from-layer="9233" from-port="2" to-layer="9235" to-port="0" /> + <edge from-layer="9234" from-port="0" to-layer="9235" to-port="1" /> + <edge from-layer="9235" from-port="2" to-layer="9253" to-port="0" /> + <edge from-layer="9235" from-port="2" to-layer="9237" to-port="0" /> + <edge from-layer="9235" from-port="2" to-layer="9236" to-port="0" /> + <edge from-layer="9235" from-port="2" to-layer="9247" to-port="0" /> + <edge from-layer="9236" from-port="2" to-layer="9256" to-port="0" /> + <edge from-layer="9237" from-port="1" to-layer="9239" to-port="0" /> + <edge from-layer="9238" from-port="0" to-layer="9239" to-port="2" /> + <edge from-layer="9239" from-port="3" to-layer="9240" to-port="0" /> + <edge from-layer="9240" from-port="2" to-layer="9241" to-port="0" /> + <edge from-layer="9241" from-port="1" to-layer="9243" to-port="0" /> + <edge from-layer="9242" from-port="0" to-layer="9243" to-port="1" /> + <edge from-layer="9243" from-port="2" to-layer="9253" to-port="2" /> + <edge from-layer="9243" from-port="2" to-layer="9247" to-port="1" /> + <edge from-layer="9244" from-port="0" to-layer="9247" to-port="2" /> + <edge from-layer="9245" from-port="0" to-layer="9247" to-port="3" /> + <edge from-layer="9246" from-port="0" to-layer="9247" to-port="4" /> + <edge from-layer="9247" from-port="5" to-layer="9249" to-port="0" /> + <edge from-layer="9248" from-port="0" to-layer="9249" to-port="1" /> + <edge from-layer="9249" from-port="2" to-layer="9254" to-port="0" /> + <edge from-layer="9250" from-port="0" to-layer="9253" to-port="1" /> + <edge from-layer="9251" from-port="0" to-layer="9253" to-port="3" /> + <edge from-layer="9252" from-port="0" to-layer="9253" to-port="4" /> + <edge from-layer="9253" from-port="5" to-layer="9254" to-port="1" /> + <edge from-layer="9254" from-port="2" to-layer="9255" to-port="0" /> + <edge from-layer="9255" from-port="2" to-layer="9256" to-port="1" /> + <edge from-layer="9256" from-port="2" to-layer="9373" to-port="0" /> + <edge from-layer="9257" from-port="0" to-layer="9262" to-port="0" /> + <edge from-layer="9258" from-port="0" to-layer="9261" to-port="1" /> + <edge from-layer="9259" from-port="0" to-layer="9261" to-port="2" /> + <edge from-layer="9260" from-port="0" to-layer="9261" to-port="3" /> + <edge from-layer="9261" from-port="4" to-layer="9262" to-port="1" /> + <edge from-layer="9262" from-port="2" to-layer="9263" to-port="0" /> + <edge from-layer="9263" from-port="1" to-layer="9265" to-port="0" /> + <edge from-layer="9264" from-port="0" to-layer="9265" to-port="2" /> + <edge from-layer="9265" from-port="3" to-layer="9361" to-port="0" /> + <edge from-layer="9265" from-port="3" to-layer="9305" to-port="0" /> + <edge from-layer="9266" from-port="0" to-layer="9267" to-port="0" /> + <edge from-layer="9267" from-port="1" to-layer="9270" to-port="0" /> + <edge from-layer="9268" from-port="0" to-layer="9269" to-port="0" /> + <edge from-layer="9269" from-port="1" to-layer="9270" to-port="1" /> + <edge from-layer="9270" from-port="2" to-layer="9272" to-port="0" /> + <edge from-layer="9271" from-port="0" to-layer="9272" to-port="1" /> + <edge from-layer="9272" from-port="2" to-layer="9274" to-port="0" /> + <edge from-layer="9273" from-port="0" to-layer="9274" to-port="1" /> + <edge from-layer="9274" from-port="2" to-layer="9275" to-port="0" /> + <edge from-layer="9275" from-port="1" to-layer="9276" to-port="1" /> + <edge from-layer="9276" from-port="2" to-layer="9279" to-port="0" /> + <edge from-layer="9277" from-port="0" to-layer="9278" to-port="0" /> + <edge from-layer="9278" from-port="1" to-layer="9279" to-port="1" /> + <edge from-layer="9279" from-port="2" to-layer="9281" to-port="0" /> + <edge from-layer="9280" from-port="0" to-layer="9281" to-port="1" /> + <edge from-layer="9281" from-port="2" to-layer="9283" to-port="0" /> + <edge from-layer="9282" from-port="0" to-layer="9283" to-port="1" /> + <edge from-layer="9283" from-port="2" to-layer="9284" to-port="0" /> + <edge from-layer="9283" from-port="2" to-layer="9285" to-port="0" /> + <edge from-layer="9283" from-port="2" to-layer="9301" to-port="0" /> + <edge from-layer="9283" from-port="2" to-layer="9295" to-port="0" /> + <edge from-layer="9284" from-port="2" to-layer="9304" to-port="0" /> + <edge from-layer="9285" from-port="1" to-layer="9287" to-port="0" /> + <edge from-layer="9286" from-port="0" to-layer="9287" to-port="2" /> + <edge from-layer="9287" from-port="3" to-layer="9288" to-port="0" /> + <edge from-layer="9288" from-port="2" to-layer="9289" to-port="0" /> + <edge from-layer="9289" from-port="1" to-layer="9291" to-port="0" /> + <edge from-layer="9290" from-port="0" to-layer="9291" to-port="1" /> + <edge from-layer="9291" from-port="2" to-layer="9301" to-port="2" /> + <edge from-layer="9291" from-port="2" to-layer="9295" to-port="1" /> + <edge from-layer="9292" from-port="0" to-layer="9295" to-port="2" /> + <edge from-layer="9293" from-port="0" to-layer="9295" to-port="3" /> + <edge from-layer="9294" from-port="0" to-layer="9295" to-port="4" /> + <edge from-layer="9295" from-port="5" to-layer="9297" to-port="0" /> + <edge from-layer="9296" from-port="0" to-layer="9297" to-port="1" /> + <edge from-layer="9297" from-port="2" to-layer="9302" to-port="0" /> + <edge from-layer="9298" from-port="0" to-layer="9301" to-port="1" /> + <edge from-layer="9299" from-port="0" to-layer="9301" to-port="3" /> + <edge from-layer="9300" from-port="0" to-layer="9301" to-port="4" /> + <edge from-layer="9301" from-port="5" to-layer="9302" to-port="1" /> + <edge from-layer="9302" from-port="2" to-layer="9303" to-port="0" /> + <edge from-layer="9303" from-port="2" to-layer="9304" to-port="1" /> + <edge from-layer="9304" from-port="2" to-layer="9305" to-port="1" /> + <edge from-layer="9304" from-port="2" to-layer="9365" to-port="0" /> + <edge from-layer="9305" from-port="2" to-layer="9306" to-port="0" /> + <edge from-layer="9305" from-port="2" to-layer="11160" to-port="0" /> + <edge from-layer="9305" from-port="2" to-layer="9307" to-port="0" /> + <edge from-layer="9306" from-port="2" to-layer="9316" to-port="0" /> + <edge from-layer="9307" from-port="1" to-layer="9310" to-port="0" /> + <edge from-layer="9307" from-port="1" to-layer="9314" to-port="0" /> + <edge from-layer="9308" from-port="0" to-layer="9310" to-port="1" /> + <edge from-layer="9309" from-port="0" to-layer="9310" to-port="2" /> + <edge from-layer="9310" from-port="3" to-layer="9315" to-port="0" /> + <edge from-layer="9311" from-port="0" to-layer="9315" to-port="1" /> + <edge from-layer="9312" from-port="0" to-layer="9314" to-port="1" /> + <edge from-layer="9313" from-port="0" to-layer="9314" to-port="2" /> + <edge from-layer="9314" from-port="3" to-layer="9315" to-port="2" /> + <edge from-layer="9315" from-port="3" to-layer="9316" to-port="1" /> + <edge from-layer="9316" from-port="2" to-layer="9318" to-port="0" /> + <edge from-layer="9317" from-port="0" to-layer="9318" to-port="1" /> + <edge from-layer="9318" from-port="2" to-layer="9373" to-port="1" /> + <edge from-layer="9319" from-port="0" to-layer="9324" to-port="0" /> + <edge from-layer="9320" from-port="0" to-layer="9323" to-port="1" /> + <edge from-layer="9321" from-port="0" to-layer="9323" to-port="2" /> + <edge from-layer="9322" from-port="0" to-layer="9323" to-port="3" /> + <edge from-layer="9323" from-port="4" to-layer="9324" to-port="1" /> + <edge from-layer="9324" from-port="2" to-layer="9325" to-port="0" /> + <edge from-layer="9325" from-port="1" to-layer="9327" to-port="0" /> + <edge from-layer="9326" from-port="0" to-layer="9327" to-port="2" /> + <edge from-layer="9327" from-port="3" to-layer="9346" to-port="0" /> + <edge from-layer="9328" from-port="0" to-layer="9329" to-port="0" /> + <edge from-layer="9329" from-port="1" to-layer="9332" to-port="0" /> + <edge from-layer="9330" from-port="0" to-layer="9331" to-port="0" /> + <edge from-layer="9331" from-port="1" to-layer="9332" to-port="1" /> + <edge from-layer="9332" from-port="2" to-layer="9334" to-port="0" /> + <edge from-layer="9333" from-port="0" to-layer="9334" to-port="1" /> + <edge from-layer="9334" from-port="2" to-layer="9336" to-port="0" /> + <edge from-layer="9335" from-port="0" to-layer="9336" to-port="1" /> + <edge from-layer="9336" from-port="2" to-layer="9337" to-port="0" /> + <edge from-layer="9337" from-port="1" to-layer="9338" to-port="1" /> + <edge from-layer="9338" from-port="2" to-layer="9341" to-port="0" /> + <edge from-layer="9339" from-port="0" to-layer="9340" to-port="0" /> + <edge from-layer="9340" from-port="1" to-layer="9341" to-port="1" /> + <edge from-layer="9341" from-port="2" to-layer="9343" to-port="0" /> + <edge from-layer="9342" from-port="0" to-layer="9343" to-port="1" /> + <edge from-layer="9343" from-port="2" to-layer="9345" to-port="0" /> + <edge from-layer="9344" from-port="0" to-layer="9345" to-port="1" /> + <edge from-layer="9345" from-port="2" to-layer="9346" to-port="1" /> + <edge from-layer="9346" from-port="2" to-layer="9347" to-port="0" /> + <edge from-layer="9346" from-port="2" to-layer="9348" to-port="0" /> + <edge from-layer="9346" from-port="2" to-layer="11159" to-port="0" /> + <edge from-layer="9347" from-port="2" to-layer="9357" to-port="0" /> + <edge from-layer="9348" from-port="1" to-layer="9351" to-port="0" /> + <edge from-layer="9348" from-port="1" to-layer="9355" to-port="0" /> + <edge from-layer="9349" from-port="0" to-layer="9351" to-port="1" /> + <edge from-layer="9350" from-port="0" to-layer="9351" to-port="2" /> + <edge from-layer="9351" from-port="3" to-layer="9356" to-port="1" /> + <edge from-layer="9352" from-port="0" to-layer="9356" to-port="2" /> + <edge from-layer="9353" from-port="0" to-layer="9355" to-port="1" /> + <edge from-layer="9354" from-port="0" to-layer="9355" to-port="2" /> + <edge from-layer="9355" from-port="3" to-layer="9356" to-port="3" /> + <edge from-layer="9356" from-port="4" to-layer="9357" to-port="1" /> + <edge from-layer="9357" from-port="2" to-layer="9359" to-port="0" /> + <edge from-layer="9358" from-port="0" to-layer="9359" to-port="1" /> + <edge from-layer="9359" from-port="2" to-layer="9373" to-port="2" /> + <edge from-layer="9360" from-port="0" to-layer="9372" to-port="1" /> + <edge from-layer="9361" from-port="1" to-layer="9364" to-port="0" /> + <edge from-layer="9362" from-port="0" to-layer="9364" to-port="1" /> + <edge from-layer="9363" from-port="0" to-layer="9364" to-port="2" /> + <edge from-layer="9364" from-port="3" to-layer="9369" to-port="0" /> + <edge from-layer="9365" from-port="1" to-layer="9368" to-port="0" /> + <edge from-layer="9366" from-port="0" to-layer="9368" to-port="1" /> + <edge from-layer="9367" from-port="0" to-layer="9368" to-port="2" /> + <edge from-layer="9368" from-port="3" to-layer="9369" to-port="1" /> + <edge from-layer="9369" from-port="2" to-layer="9372" to-port="2" /> + <edge from-layer="9370" from-port="0" to-layer="9372" to-port="3" /> + <edge from-layer="9371" from-port="0" to-layer="9372" to-port="4" /> + <edge from-layer="9372" from-port="5" to-layer="9373" to-port="3" /> + <edge from-layer="9373" from-port="4" to-layer="9375" to-port="0" /> + <edge from-layer="9374" from-port="0" to-layer="9375" to-port="1" /> + <edge from-layer="9375" from-port="2" to-layer="9377" to-port="0" /> + <edge from-layer="9376" from-port="0" to-layer="9377" to-port="1" /> + <edge from-layer="9377" from-port="2" to-layer="9388" to-port="0" /> + <edge from-layer="9378" from-port="0" to-layer="9379" to-port="0" /> + <edge from-layer="9379" from-port="1" to-layer="9382" to-port="0" /> + <edge from-layer="9380" from-port="0" to-layer="9381" to-port="0" /> + <edge from-layer="9381" from-port="1" to-layer="9382" to-port="1" /> + <edge from-layer="9382" from-port="2" to-layer="9384" to-port="0" /> + <edge from-layer="9383" from-port="0" to-layer="9384" to-port="1" /> + <edge from-layer="9384" from-port="2" to-layer="9386" to-port="0" /> + <edge from-layer="9385" from-port="0" to-layer="9386" to-port="1" /> + <edge from-layer="9386" from-port="2" to-layer="9387" to-port="0" /> + <edge from-layer="9387" from-port="1" to-layer="9388" to-port="1" /> + <edge from-layer="9388" from-port="2" to-layer="9389" to-port="1" /> + <edge from-layer="9389" from-port="2" to-layer="9437" to-port="0" /> + <edge from-layer="9389" from-port="2" to-layer="9400" to-port="0" /> + <edge from-layer="9389" from-port="2" to-layer="9393" to-port="0" /> + <edge from-layer="9390" from-port="0" to-layer="9401" to-port="0" /> + <edge from-layer="9391" from-port="0" to-layer="9399" to-port="0" /> + <edge from-layer="9392" from-port="0" to-layer="9393" to-port="1" /> + <edge from-layer="9393" from-port="2" to-layer="9395" to-port="0" /> + <edge from-layer="9394" from-port="0" to-layer="9395" to-port="1" /> + <edge from-layer="9395" from-port="2" to-layer="9397" to-port="0" /> + <edge from-layer="9396" from-port="0" to-layer="9397" to-port="1" /> + <edge from-layer="9397" from-port="2" to-layer="9398" to-port="0" /> + <edge from-layer="9398" from-port="1" to-layer="9399" to-port="1" /> + <edge from-layer="9399" from-port="2" to-layer="9400" to-port="1" /> + <edge from-layer="9400" from-port="2" to-layer="9401" to-port="1" /> + <edge from-layer="9401" from-port="2" to-layer="9412" to-port="0" /> + <edge from-layer="9401" from-port="2" to-layer="9424" to-port="0" /> + <edge from-layer="9402" from-port="0" to-layer="9403" to-port="0" /> + <edge from-layer="9403" from-port="1" to-layer="9406" to-port="0" /> + <edge from-layer="9404" from-port="0" to-layer="9405" to-port="0" /> + <edge from-layer="9405" from-port="1" to-layer="9406" to-port="1" /> + <edge from-layer="9406" from-port="2" to-layer="9408" to-port="0" /> + <edge from-layer="9407" from-port="0" to-layer="9408" to-port="1" /> + <edge from-layer="9408" from-port="2" to-layer="9410" to-port="0" /> + <edge from-layer="9409" from-port="0" to-layer="9410" to-port="1" /> + <edge from-layer="9410" from-port="2" to-layer="9411" to-port="0" /> + <edge from-layer="9411" from-port="1" to-layer="9412" to-port="1" /> + <edge from-layer="9412" from-port="2" to-layer="9413" to-port="0" /> + <edge from-layer="9413" from-port="1" to-layer="9425" to-port="0" /> + <edge from-layer="9414" from-port="0" to-layer="9415" to-port="0" /> + <edge from-layer="9415" from-port="1" to-layer="9418" to-port="0" /> + <edge from-layer="9416" from-port="0" to-layer="9417" to-port="0" /> + <edge from-layer="9417" from-port="1" to-layer="9418" to-port="1" /> + <edge from-layer="9418" from-port="2" to-layer="9420" to-port="0" /> + <edge from-layer="9419" from-port="0" to-layer="9420" to-port="1" /> + <edge from-layer="9420" from-port="2" to-layer="9422" to-port="0" /> + <edge from-layer="9421" from-port="0" to-layer="9422" to-port="1" /> + <edge from-layer="9422" from-port="2" to-layer="9423" to-port="0" /> + <edge from-layer="9423" from-port="1" to-layer="9424" to-port="1" /> + <edge from-layer="9424" from-port="2" to-layer="9425" to-port="1" /> + <edge from-layer="9425" from-port="2" to-layer="9436" to-port="0" /> + <edge from-layer="9426" from-port="0" to-layer="9427" to-port="0" /> + <edge from-layer="9427" from-port="1" to-layer="9430" to-port="0" /> + <edge from-layer="9428" from-port="0" to-layer="9429" to-port="0" /> + <edge from-layer="9429" from-port="1" to-layer="9430" to-port="1" /> + <edge from-layer="9430" from-port="2" to-layer="9432" to-port="0" /> + <edge from-layer="9431" from-port="0" to-layer="9432" to-port="1" /> + <edge from-layer="9432" from-port="2" to-layer="9434" to-port="0" /> + <edge from-layer="9433" from-port="0" to-layer="9434" to-port="1" /> + <edge from-layer="9434" from-port="2" to-layer="9435" to-port="0" /> + <edge from-layer="9435" from-port="1" to-layer="9436" to-port="1" /> + <edge from-layer="9436" from-port="2" to-layer="9437" to-port="1" /> + <edge from-layer="9437" from-port="2" to-layer="9441" to-port="0" /> + <edge from-layer="9437" from-port="2" to-layer="9621" to-port="0" /> + <edge from-layer="9437" from-port="2" to-layer="9448" to-port="0" /> + <edge from-layer="9438" from-port="0" to-layer="9449" to-port="0" /> + <edge from-layer="9439" from-port="0" to-layer="9447" to-port="0" /> + <edge from-layer="9440" from-port="0" to-layer="9441" to-port="1" /> + <edge from-layer="9441" from-port="2" to-layer="9443" to-port="0" /> + <edge from-layer="9442" from-port="0" to-layer="9443" to-port="1" /> + <edge from-layer="9443" from-port="2" to-layer="9445" to-port="0" /> + <edge from-layer="9444" from-port="0" to-layer="9445" to-port="1" /> + <edge from-layer="9445" from-port="2" to-layer="9446" to-port="0" /> + <edge from-layer="9446" from-port="1" to-layer="9447" to-port="1" /> + <edge from-layer="9447" from-port="2" to-layer="9448" to-port="1" /> + <edge from-layer="9448" from-port="2" to-layer="9449" to-port="1" /> + <edge from-layer="9449" from-port="2" to-layer="9460" to-port="0" /> + <edge from-layer="9449" from-port="2" to-layer="9570" to-port="0" /> + <edge from-layer="9449" from-port="2" to-layer="9508" to-port="0" /> + <edge from-layer="9450" from-port="0" to-layer="9451" to-port="0" /> + <edge from-layer="9451" from-port="1" to-layer="9454" to-port="0" /> + <edge from-layer="9452" from-port="0" to-layer="9453" to-port="0" /> + <edge from-layer="9453" from-port="1" to-layer="9454" to-port="1" /> + <edge from-layer="9454" from-port="2" to-layer="9456" to-port="0" /> + <edge from-layer="9455" from-port="0" to-layer="9456" to-port="1" /> + <edge from-layer="9456" from-port="2" to-layer="9458" to-port="0" /> + <edge from-layer="9457" from-port="0" to-layer="9458" to-port="1" /> + <edge from-layer="9458" from-port="2" to-layer="9459" to-port="0" /> + <edge from-layer="9459" from-port="1" to-layer="9460" to-port="1" /> + <edge from-layer="9460" from-port="2" to-layer="9463" to-port="0" /> + <edge from-layer="9461" from-port="0" to-layer="9462" to-port="0" /> + <edge from-layer="9462" from-port="1" to-layer="9463" to-port="1" /> + <edge from-layer="9463" from-port="2" to-layer="9465" to-port="0" /> + <edge from-layer="9464" from-port="0" to-layer="9465" to-port="1" /> + <edge from-layer="9465" from-port="2" to-layer="9467" to-port="0" /> + <edge from-layer="9466" from-port="0" to-layer="9467" to-port="1" /> + <edge from-layer="9467" from-port="2" to-layer="9485" to-port="0" /> + <edge from-layer="9467" from-port="2" to-layer="9468" to-port="0" /> + <edge from-layer="9467" from-port="2" to-layer="9469" to-port="0" /> + <edge from-layer="9467" from-port="2" to-layer="9479" to-port="0" /> + <edge from-layer="9468" from-port="2" to-layer="9488" to-port="0" /> + <edge from-layer="9469" from-port="1" to-layer="9471" to-port="0" /> + <edge from-layer="9470" from-port="0" to-layer="9471" to-port="2" /> + <edge from-layer="9471" from-port="3" to-layer="9472" to-port="0" /> + <edge from-layer="9472" from-port="2" to-layer="9473" to-port="0" /> + <edge from-layer="9473" from-port="1" to-layer="9475" to-port="0" /> + <edge from-layer="9474" from-port="0" to-layer="9475" to-port="1" /> + <edge from-layer="9475" from-port="2" to-layer="9485" to-port="2" /> + <edge from-layer="9475" from-port="2" to-layer="9479" to-port="1" /> + <edge from-layer="9476" from-port="0" to-layer="9479" to-port="2" /> + <edge from-layer="9477" from-port="0" to-layer="9479" to-port="3" /> + <edge from-layer="9478" from-port="0" to-layer="9479" to-port="4" /> + <edge from-layer="9479" from-port="5" to-layer="9481" to-port="0" /> + <edge from-layer="9480" from-port="0" to-layer="9481" to-port="1" /> + <edge from-layer="9481" from-port="2" to-layer="9486" to-port="0" /> + <edge from-layer="9482" from-port="0" to-layer="9485" to-port="1" /> + <edge from-layer="9483" from-port="0" to-layer="9485" to-port="3" /> + <edge from-layer="9484" from-port="0" to-layer="9485" to-port="4" /> + <edge from-layer="9485" from-port="5" to-layer="9486" to-port="1" /> + <edge from-layer="9486" from-port="2" to-layer="9487" to-port="0" /> + <edge from-layer="9487" from-port="2" to-layer="9488" to-port="1" /> + <edge from-layer="9488" from-port="2" to-layer="9605" to-port="0" /> + <edge from-layer="9489" from-port="0" to-layer="9494" to-port="0" /> + <edge from-layer="9490" from-port="0" to-layer="9493" to-port="1" /> + <edge from-layer="9491" from-port="0" to-layer="9493" to-port="2" /> + <edge from-layer="9492" from-port="0" to-layer="9493" to-port="3" /> + <edge from-layer="9493" from-port="4" to-layer="9494" to-port="1" /> + <edge from-layer="9494" from-port="2" to-layer="9495" to-port="0" /> + <edge from-layer="9495" from-port="1" to-layer="9497" to-port="0" /> + <edge from-layer="9496" from-port="0" to-layer="9497" to-port="2" /> + <edge from-layer="9497" from-port="3" to-layer="9593" to-port="0" /> + <edge from-layer="9497" from-port="3" to-layer="9537" to-port="0" /> + <edge from-layer="9498" from-port="0" to-layer="9499" to-port="0" /> + <edge from-layer="9499" from-port="1" to-layer="9502" to-port="0" /> + <edge from-layer="9500" from-port="0" to-layer="9501" to-port="0" /> + <edge from-layer="9501" from-port="1" to-layer="9502" to-port="1" /> + <edge from-layer="9502" from-port="2" to-layer="9504" to-port="0" /> + <edge from-layer="9503" from-port="0" to-layer="9504" to-port="1" /> + <edge from-layer="9504" from-port="2" to-layer="9506" to-port="0" /> + <edge from-layer="9505" from-port="0" to-layer="9506" to-port="1" /> + <edge from-layer="9506" from-port="2" to-layer="9507" to-port="0" /> + <edge from-layer="9507" from-port="1" to-layer="9508" to-port="1" /> + <edge from-layer="9508" from-port="2" to-layer="9511" to-port="0" /> + <edge from-layer="9509" from-port="0" to-layer="9510" to-port="0" /> + <edge from-layer="9510" from-port="1" to-layer="9511" to-port="1" /> + <edge from-layer="9511" from-port="2" to-layer="9513" to-port="0" /> + <edge from-layer="9512" from-port="0" to-layer="9513" to-port="1" /> + <edge from-layer="9513" from-port="2" to-layer="9515" to-port="0" /> + <edge from-layer="9514" from-port="0" to-layer="9515" to-port="1" /> + <edge from-layer="9515" from-port="2" to-layer="9533" to-port="0" /> + <edge from-layer="9515" from-port="2" to-layer="9516" to-port="0" /> + <edge from-layer="9515" from-port="2" to-layer="9527" to-port="0" /> + <edge from-layer="9515" from-port="2" to-layer="9517" to-port="0" /> + <edge from-layer="9516" from-port="2" to-layer="9536" to-port="0" /> + <edge from-layer="9517" from-port="1" to-layer="9519" to-port="0" /> + <edge from-layer="9518" from-port="0" to-layer="9519" to-port="2" /> + <edge from-layer="9519" from-port="3" to-layer="9520" to-port="0" /> + <edge from-layer="9520" from-port="2" to-layer="9521" to-port="0" /> + <edge from-layer="9521" from-port="1" to-layer="9523" to-port="0" /> + <edge from-layer="9522" from-port="0" to-layer="9523" to-port="1" /> + <edge from-layer="9523" from-port="2" to-layer="9527" to-port="1" /> + <edge from-layer="9523" from-port="2" to-layer="9533" to-port="2" /> + <edge from-layer="9524" from-port="0" to-layer="9527" to-port="2" /> + <edge from-layer="9525" from-port="0" to-layer="9527" to-port="3" /> + <edge from-layer="9526" from-port="0" to-layer="9527" to-port="4" /> + <edge from-layer="9527" from-port="5" to-layer="9529" to-port="0" /> + <edge from-layer="9528" from-port="0" to-layer="9529" to-port="1" /> + <edge from-layer="9529" from-port="2" to-layer="9534" to-port="0" /> + <edge from-layer="9530" from-port="0" to-layer="9533" to-port="1" /> + <edge from-layer="9531" from-port="0" to-layer="9533" to-port="3" /> + <edge from-layer="9532" from-port="0" to-layer="9533" to-port="4" /> + <edge from-layer="9533" from-port="5" to-layer="9534" to-port="1" /> + <edge from-layer="9534" from-port="2" to-layer="9535" to-port="0" /> + <edge from-layer="9535" from-port="2" to-layer="9536" to-port="1" /> + <edge from-layer="9536" from-port="2" to-layer="9597" to-port="0" /> + <edge from-layer="9536" from-port="2" to-layer="9537" to-port="1" /> + <edge from-layer="9537" from-port="2" to-layer="9538" to-port="0" /> + <edge from-layer="9537" from-port="2" to-layer="11156" to-port="0" /> + <edge from-layer="9537" from-port="2" to-layer="9539" to-port="0" /> + <edge from-layer="9538" from-port="2" to-layer="9548" to-port="0" /> + <edge from-layer="9539" from-port="1" to-layer="9542" to-port="0" /> + <edge from-layer="9539" from-port="1" to-layer="9546" to-port="0" /> + <edge from-layer="9540" from-port="0" to-layer="9542" to-port="1" /> + <edge from-layer="9541" from-port="0" to-layer="9542" to-port="2" /> + <edge from-layer="9542" from-port="3" to-layer="9547" to-port="0" /> + <edge from-layer="9543" from-port="0" to-layer="9547" to-port="1" /> + <edge from-layer="9544" from-port="0" to-layer="9546" to-port="1" /> + <edge from-layer="9545" from-port="0" to-layer="9546" to-port="2" /> + <edge from-layer="9546" from-port="3" to-layer="9547" to-port="2" /> + <edge from-layer="9547" from-port="3" to-layer="9548" to-port="1" /> + <edge from-layer="9548" from-port="2" to-layer="9550" to-port="0" /> + <edge from-layer="9549" from-port="0" to-layer="9550" to-port="1" /> + <edge from-layer="9550" from-port="2" to-layer="9605" to-port="1" /> + <edge from-layer="9551" from-port="0" to-layer="9556" to-port="0" /> + <edge from-layer="9552" from-port="0" to-layer="9555" to-port="1" /> + <edge from-layer="9553" from-port="0" to-layer="9555" to-port="2" /> + <edge from-layer="9554" from-port="0" to-layer="9555" to-port="3" /> + <edge from-layer="9555" from-port="4" to-layer="9556" to-port="1" /> + <edge from-layer="9556" from-port="2" to-layer="9557" to-port="0" /> + <edge from-layer="9557" from-port="1" to-layer="9559" to-port="0" /> + <edge from-layer="9558" from-port="0" to-layer="9559" to-port="2" /> + <edge from-layer="9559" from-port="3" to-layer="9578" to-port="0" /> + <edge from-layer="9560" from-port="0" to-layer="9561" to-port="0" /> + <edge from-layer="9561" from-port="1" to-layer="9564" to-port="0" /> + <edge from-layer="9562" from-port="0" to-layer="9563" to-port="0" /> + <edge from-layer="9563" from-port="1" to-layer="9564" to-port="1" /> + <edge from-layer="9564" from-port="2" to-layer="9566" to-port="0" /> + <edge from-layer="9565" from-port="0" to-layer="9566" to-port="1" /> + <edge from-layer="9566" from-port="2" to-layer="9568" to-port="0" /> + <edge from-layer="9567" from-port="0" to-layer="9568" to-port="1" /> + <edge from-layer="9568" from-port="2" to-layer="9569" to-port="0" /> + <edge from-layer="9569" from-port="1" to-layer="9570" to-port="1" /> + <edge from-layer="9570" from-port="2" to-layer="9573" to-port="0" /> + <edge from-layer="9571" from-port="0" to-layer="9572" to-port="0" /> + <edge from-layer="9572" from-port="1" to-layer="9573" to-port="1" /> + <edge from-layer="9573" from-port="2" to-layer="9575" to-port="0" /> + <edge from-layer="9574" from-port="0" to-layer="9575" to-port="1" /> + <edge from-layer="9575" from-port="2" to-layer="9577" to-port="0" /> + <edge from-layer="9576" from-port="0" to-layer="9577" to-port="1" /> + <edge from-layer="9577" from-port="2" to-layer="9578" to-port="1" /> + <edge from-layer="9578" from-port="2" to-layer="9579" to-port="0" /> + <edge from-layer="9578" from-port="2" to-layer="9580" to-port="0" /> + <edge from-layer="9578" from-port="2" to-layer="11155" to-port="0" /> + <edge from-layer="9579" from-port="2" to-layer="9589" to-port="0" /> + <edge from-layer="9580" from-port="1" to-layer="9583" to-port="0" /> + <edge from-layer="9580" from-port="1" to-layer="9587" to-port="0" /> + <edge from-layer="9581" from-port="0" to-layer="9583" to-port="1" /> + <edge from-layer="9582" from-port="0" to-layer="9583" to-port="2" /> + <edge from-layer="9583" from-port="3" to-layer="9588" to-port="1" /> + <edge from-layer="9584" from-port="0" to-layer="9588" to-port="2" /> + <edge from-layer="9585" from-port="0" to-layer="9587" to-port="1" /> + <edge from-layer="9586" from-port="0" to-layer="9587" to-port="2" /> + <edge from-layer="9587" from-port="3" to-layer="9588" to-port="3" /> + <edge from-layer="9588" from-port="4" to-layer="9589" to-port="1" /> + <edge from-layer="9589" from-port="2" to-layer="9591" to-port="0" /> + <edge from-layer="9590" from-port="0" to-layer="9591" to-port="1" /> + <edge from-layer="9591" from-port="2" to-layer="9605" to-port="2" /> + <edge from-layer="9592" from-port="0" to-layer="9604" to-port="1" /> + <edge from-layer="9593" from-port="1" to-layer="9596" to-port="0" /> + <edge from-layer="9594" from-port="0" to-layer="9596" to-port="1" /> + <edge from-layer="9595" from-port="0" to-layer="9596" to-port="2" /> + <edge from-layer="9596" from-port="3" to-layer="9601" to-port="0" /> + <edge from-layer="9597" from-port="1" to-layer="9600" to-port="0" /> + <edge from-layer="9598" from-port="0" to-layer="9600" to-port="1" /> + <edge from-layer="9599" from-port="0" to-layer="9600" to-port="2" /> + <edge from-layer="9600" from-port="3" to-layer="9601" to-port="1" /> + <edge from-layer="9601" from-port="2" to-layer="9604" to-port="2" /> + <edge from-layer="9602" from-port="0" to-layer="9604" to-port="3" /> + <edge from-layer="9603" from-port="0" to-layer="9604" to-port="4" /> + <edge from-layer="9604" from-port="5" to-layer="9605" to-port="3" /> + <edge from-layer="9605" from-port="4" to-layer="9607" to-port="0" /> + <edge from-layer="9606" from-port="0" to-layer="9607" to-port="1" /> + <edge from-layer="9607" from-port="2" to-layer="9609" to-port="0" /> + <edge from-layer="9608" from-port="0" to-layer="9609" to-port="1" /> + <edge from-layer="9609" from-port="2" to-layer="9620" to-port="0" /> + <edge from-layer="9610" from-port="0" to-layer="9611" to-port="0" /> + <edge from-layer="9611" from-port="1" to-layer="9614" to-port="0" /> + <edge from-layer="9612" from-port="0" to-layer="9613" to-port="0" /> + <edge from-layer="9613" from-port="1" to-layer="9614" to-port="1" /> + <edge from-layer="9614" from-port="2" to-layer="9616" to-port="0" /> + <edge from-layer="9615" from-port="0" to-layer="9616" to-port="1" /> + <edge from-layer="9616" from-port="2" to-layer="9618" to-port="0" /> + <edge from-layer="9617" from-port="0" to-layer="9618" to-port="1" /> + <edge from-layer="9618" from-port="2" to-layer="9619" to-port="0" /> + <edge from-layer="9619" from-port="1" to-layer="9620" to-port="1" /> + <edge from-layer="9620" from-port="2" to-layer="9621" to-port="1" /> + <edge from-layer="9621" from-port="2" to-layer="9669" to-port="0" /> + <edge from-layer="9621" from-port="2" to-layer="9632" to-port="0" /> + <edge from-layer="9621" from-port="2" to-layer="9625" to-port="0" /> + <edge from-layer="9622" from-port="0" to-layer="9633" to-port="0" /> + <edge from-layer="9623" from-port="0" to-layer="9631" to-port="0" /> + <edge from-layer="9624" from-port="0" to-layer="9625" to-port="1" /> + <edge from-layer="9625" from-port="2" to-layer="9627" to-port="0" /> + <edge from-layer="9626" from-port="0" to-layer="9627" to-port="1" /> + <edge from-layer="9627" from-port="2" to-layer="9629" to-port="0" /> + <edge from-layer="9628" from-port="0" to-layer="9629" to-port="1" /> + <edge from-layer="9629" from-port="2" to-layer="9630" to-port="0" /> + <edge from-layer="9630" from-port="1" to-layer="9631" to-port="1" /> + <edge from-layer="9631" from-port="2" to-layer="9632" to-port="1" /> + <edge from-layer="9632" from-port="2" to-layer="9633" to-port="1" /> + <edge from-layer="9633" from-port="2" to-layer="9656" to-port="0" /> + <edge from-layer="9633" from-port="2" to-layer="9644" to-port="0" /> + <edge from-layer="9634" from-port="0" to-layer="9635" to-port="0" /> + <edge from-layer="9635" from-port="1" to-layer="9638" to-port="0" /> + <edge from-layer="9636" from-port="0" to-layer="9637" to-port="0" /> + <edge from-layer="9637" from-port="1" to-layer="9638" to-port="1" /> + <edge from-layer="9638" from-port="2" to-layer="9640" to-port="0" /> + <edge from-layer="9639" from-port="0" to-layer="9640" to-port="1" /> + <edge from-layer="9640" from-port="2" to-layer="9642" to-port="0" /> + <edge from-layer="9641" from-port="0" to-layer="9642" to-port="1" /> + <edge from-layer="9642" from-port="2" to-layer="9643" to-port="0" /> + <edge from-layer="9643" from-port="1" to-layer="9644" to-port="1" /> + <edge from-layer="9644" from-port="2" to-layer="9645" to-port="0" /> + <edge from-layer="9645" from-port="1" to-layer="9657" to-port="0" /> + <edge from-layer="9646" from-port="0" to-layer="9647" to-port="0" /> + <edge from-layer="9647" from-port="1" to-layer="9650" to-port="0" /> + <edge from-layer="9648" from-port="0" to-layer="9649" to-port="0" /> + <edge from-layer="9649" from-port="1" to-layer="9650" to-port="1" /> + <edge from-layer="9650" from-port="2" to-layer="9652" to-port="0" /> + <edge from-layer="9651" from-port="0" to-layer="9652" to-port="1" /> + <edge from-layer="9652" from-port="2" to-layer="9654" to-port="0" /> + <edge from-layer="9653" from-port="0" to-layer="9654" to-port="1" /> + <edge from-layer="9654" from-port="2" to-layer="9655" to-port="0" /> + <edge from-layer="9655" from-port="1" to-layer="9656" to-port="1" /> + <edge from-layer="9656" from-port="2" to-layer="9657" to-port="1" /> + <edge from-layer="9657" from-port="2" to-layer="9668" to-port="0" /> + <edge from-layer="9658" from-port="0" to-layer="9659" to-port="0" /> + <edge from-layer="9659" from-port="1" to-layer="9662" to-port="0" /> + <edge from-layer="9660" from-port="0" to-layer="9661" to-port="0" /> + <edge from-layer="9661" from-port="1" to-layer="9662" to-port="1" /> + <edge from-layer="9662" from-port="2" to-layer="9664" to-port="0" /> + <edge from-layer="9663" from-port="0" to-layer="9664" to-port="1" /> + <edge from-layer="9664" from-port="2" to-layer="9666" to-port="0" /> + <edge from-layer="9665" from-port="0" to-layer="9666" to-port="1" /> + <edge from-layer="9666" from-port="2" to-layer="9667" to-port="0" /> + <edge from-layer="9667" from-port="1" to-layer="9668" to-port="1" /> + <edge from-layer="9668" from-port="2" to-layer="9669" to-port="1" /> + <edge from-layer="9669" from-port="2" to-layer="9853" to-port="0" /> + <edge from-layer="9669" from-port="2" to-layer="9673" to-port="0" /> + <edge from-layer="9669" from-port="2" to-layer="9680" to-port="0" /> + <edge from-layer="9670" from-port="0" to-layer="9681" to-port="0" /> + <edge from-layer="9671" from-port="0" to-layer="9679" to-port="0" /> + <edge from-layer="9672" from-port="0" to-layer="9673" to-port="1" /> + <edge from-layer="9673" from-port="2" to-layer="9675" to-port="0" /> + <edge from-layer="9674" from-port="0" to-layer="9675" to-port="1" /> + <edge from-layer="9675" from-port="2" to-layer="9677" to-port="0" /> + <edge from-layer="9676" from-port="0" to-layer="9677" to-port="1" /> + <edge from-layer="9677" from-port="2" to-layer="9678" to-port="0" /> + <edge from-layer="9678" from-port="1" to-layer="9679" to-port="1" /> + <edge from-layer="9679" from-port="2" to-layer="9680" to-port="1" /> + <edge from-layer="9680" from-port="2" to-layer="9681" to-port="1" /> + <edge from-layer="9681" from-port="2" to-layer="9802" to-port="0" /> + <edge from-layer="9681" from-port="2" to-layer="9740" to-port="0" /> + <edge from-layer="9681" from-port="2" to-layer="9692" to-port="0" /> + <edge from-layer="9682" from-port="0" to-layer="9683" to-port="0" /> + <edge from-layer="9683" from-port="1" to-layer="9686" to-port="0" /> + <edge from-layer="9684" from-port="0" to-layer="9685" to-port="0" /> + <edge from-layer="9685" from-port="1" to-layer="9686" to-port="1" /> + <edge from-layer="9686" from-port="2" to-layer="9688" to-port="0" /> + <edge from-layer="9687" from-port="0" to-layer="9688" to-port="1" /> + <edge from-layer="9688" from-port="2" to-layer="9690" to-port="0" /> + <edge from-layer="9689" from-port="0" to-layer="9690" to-port="1" /> + <edge from-layer="9690" from-port="2" to-layer="9691" to-port="0" /> + <edge from-layer="9691" from-port="1" to-layer="9692" to-port="1" /> + <edge from-layer="9692" from-port="2" to-layer="9695" to-port="0" /> + <edge from-layer="9693" from-port="0" to-layer="9694" to-port="0" /> + <edge from-layer="9694" from-port="1" to-layer="9695" to-port="1" /> + <edge from-layer="9695" from-port="2" to-layer="9697" to-port="0" /> + <edge from-layer="9696" from-port="0" to-layer="9697" to-port="1" /> + <edge from-layer="9697" from-port="2" to-layer="9699" to-port="0" /> + <edge from-layer="9698" from-port="0" to-layer="9699" to-port="1" /> + <edge from-layer="9699" from-port="2" to-layer="9701" to-port="0" /> + <edge from-layer="9699" from-port="2" to-layer="9700" to-port="0" /> + <edge from-layer="9699" from-port="2" to-layer="9717" to-port="0" /> + <edge from-layer="9699" from-port="2" to-layer="9711" to-port="0" /> + <edge from-layer="9700" from-port="2" to-layer="9720" to-port="0" /> + <edge from-layer="9701" from-port="1" to-layer="9703" to-port="0" /> + <edge from-layer="9702" from-port="0" to-layer="9703" to-port="2" /> + <edge from-layer="9703" from-port="3" to-layer="9704" to-port="0" /> + <edge from-layer="9704" from-port="2" to-layer="9705" to-port="0" /> + <edge from-layer="9705" from-port="1" to-layer="9707" to-port="0" /> + <edge from-layer="9706" from-port="0" to-layer="9707" to-port="1" /> + <edge from-layer="9707" from-port="2" to-layer="9717" to-port="2" /> + <edge from-layer="9707" from-port="2" to-layer="9711" to-port="1" /> + <edge from-layer="9708" from-port="0" to-layer="9711" to-port="2" /> + <edge from-layer="9709" from-port="0" to-layer="9711" to-port="3" /> + <edge from-layer="9710" from-port="0" to-layer="9711" to-port="4" /> + <edge from-layer="9711" from-port="5" to-layer="9713" to-port="0" /> + <edge from-layer="9712" from-port="0" to-layer="9713" to-port="1" /> + <edge from-layer="9713" from-port="2" to-layer="9718" to-port="0" /> + <edge from-layer="9714" from-port="0" to-layer="9717" to-port="1" /> + <edge from-layer="9715" from-port="0" to-layer="9717" to-port="3" /> + <edge from-layer="9716" from-port="0" to-layer="9717" to-port="4" /> + <edge from-layer="9717" from-port="5" to-layer="9718" to-port="1" /> + <edge from-layer="9718" from-port="2" to-layer="9719" to-port="0" /> + <edge from-layer="9719" from-port="2" to-layer="9720" to-port="1" /> + <edge from-layer="9720" from-port="2" to-layer="9837" to-port="0" /> + <edge from-layer="9721" from-port="0" to-layer="9726" to-port="0" /> + <edge from-layer="9722" from-port="0" to-layer="9725" to-port="1" /> + <edge from-layer="9723" from-port="0" to-layer="9725" to-port="2" /> + <edge from-layer="9724" from-port="0" to-layer="9725" to-port="3" /> + <edge from-layer="9725" from-port="4" to-layer="9726" to-port="1" /> + <edge from-layer="9726" from-port="2" to-layer="9727" to-port="0" /> + <edge from-layer="9727" from-port="1" to-layer="9729" to-port="0" /> + <edge from-layer="9728" from-port="0" to-layer="9729" to-port="2" /> + <edge from-layer="9729" from-port="3" to-layer="9825" to-port="0" /> + <edge from-layer="9729" from-port="3" to-layer="9769" to-port="0" /> + <edge from-layer="9730" from-port="0" to-layer="9731" to-port="0" /> + <edge from-layer="9731" from-port="1" to-layer="9734" to-port="0" /> + <edge from-layer="9732" from-port="0" to-layer="9733" to-port="0" /> + <edge from-layer="9733" from-port="1" to-layer="9734" to-port="1" /> + <edge from-layer="9734" from-port="2" to-layer="9736" to-port="0" /> + <edge from-layer="9735" from-port="0" to-layer="9736" to-port="1" /> + <edge from-layer="9736" from-port="2" to-layer="9738" to-port="0" /> + <edge from-layer="9737" from-port="0" to-layer="9738" to-port="1" /> + <edge from-layer="9738" from-port="2" to-layer="9739" to-port="0" /> + <edge from-layer="9739" from-port="1" to-layer="9740" to-port="1" /> + <edge from-layer="9740" from-port="2" to-layer="9743" to-port="0" /> + <edge from-layer="9741" from-port="0" to-layer="9742" to-port="0" /> + <edge from-layer="9742" from-port="1" to-layer="9743" to-port="1" /> + <edge from-layer="9743" from-port="2" to-layer="9745" to-port="0" /> + <edge from-layer="9744" from-port="0" to-layer="9745" to-port="1" /> + <edge from-layer="9745" from-port="2" to-layer="9747" to-port="0" /> + <edge from-layer="9746" from-port="0" to-layer="9747" to-port="1" /> + <edge from-layer="9747" from-port="2" to-layer="9748" to-port="0" /> + <edge from-layer="9747" from-port="2" to-layer="9749" to-port="0" /> + <edge from-layer="9747" from-port="2" to-layer="9759" to-port="0" /> + <edge from-layer="9747" from-port="2" to-layer="9765" to-port="0" /> + <edge from-layer="9748" from-port="2" to-layer="9768" to-port="0" /> + <edge from-layer="9749" from-port="1" to-layer="9751" to-port="0" /> + <edge from-layer="9750" from-port="0" to-layer="9751" to-port="2" /> + <edge from-layer="9751" from-port="3" to-layer="9752" to-port="0" /> + <edge from-layer="9752" from-port="2" to-layer="9753" to-port="0" /> + <edge from-layer="9753" from-port="1" to-layer="9755" to-port="0" /> + <edge from-layer="9754" from-port="0" to-layer="9755" to-port="1" /> + <edge from-layer="9755" from-port="2" to-layer="9759" to-port="1" /> + <edge from-layer="9755" from-port="2" to-layer="9765" to-port="2" /> + <edge from-layer="9756" from-port="0" to-layer="9759" to-port="2" /> + <edge from-layer="9757" from-port="0" to-layer="9759" to-port="3" /> + <edge from-layer="9758" from-port="0" to-layer="9759" to-port="4" /> + <edge from-layer="9759" from-port="5" to-layer="9761" to-port="0" /> + <edge from-layer="9760" from-port="0" to-layer="9761" to-port="1" /> + <edge from-layer="9761" from-port="2" to-layer="9766" to-port="0" /> + <edge from-layer="9762" from-port="0" to-layer="9765" to-port="1" /> + <edge from-layer="9763" from-port="0" to-layer="9765" to-port="3" /> + <edge from-layer="9764" from-port="0" to-layer="9765" to-port="4" /> + <edge from-layer="9765" from-port="5" to-layer="9766" to-port="1" /> + <edge from-layer="9766" from-port="2" to-layer="9767" to-port="0" /> + <edge from-layer="9767" from-port="2" to-layer="9768" to-port="1" /> + <edge from-layer="9768" from-port="2" to-layer="9829" to-port="0" /> + <edge from-layer="9768" from-port="2" to-layer="9769" to-port="1" /> + <edge from-layer="9769" from-port="2" to-layer="11154" to-port="0" /> + <edge from-layer="9769" from-port="2" to-layer="9771" to-port="0" /> + <edge from-layer="9769" from-port="2" to-layer="9770" to-port="0" /> + <edge from-layer="9770" from-port="2" to-layer="9780" to-port="0" /> + <edge from-layer="9771" from-port="1" to-layer="9778" to-port="0" /> + <edge from-layer="9771" from-port="1" to-layer="9774" to-port="0" /> + <edge from-layer="9772" from-port="0" to-layer="9774" to-port="1" /> + <edge from-layer="9773" from-port="0" to-layer="9774" to-port="2" /> + <edge from-layer="9774" from-port="3" to-layer="9779" to-port="0" /> + <edge from-layer="9775" from-port="0" to-layer="9779" to-port="1" /> + <edge from-layer="9776" from-port="0" to-layer="9778" to-port="1" /> + <edge from-layer="9777" from-port="0" to-layer="9778" to-port="2" /> + <edge from-layer="9778" from-port="3" to-layer="9779" to-port="2" /> + <edge from-layer="9779" from-port="3" to-layer="9780" to-port="1" /> + <edge from-layer="9780" from-port="2" to-layer="9782" to-port="0" /> + <edge from-layer="9781" from-port="0" to-layer="9782" to-port="1" /> + <edge from-layer="9782" from-port="2" to-layer="9837" to-port="1" /> + <edge from-layer="9783" from-port="0" to-layer="9788" to-port="0" /> + <edge from-layer="9784" from-port="0" to-layer="9787" to-port="1" /> + <edge from-layer="9785" from-port="0" to-layer="9787" to-port="2" /> + <edge from-layer="9786" from-port="0" to-layer="9787" to-port="3" /> + <edge from-layer="9787" from-port="4" to-layer="9788" to-port="1" /> + <edge from-layer="9788" from-port="2" to-layer="9789" to-port="0" /> + <edge from-layer="9789" from-port="1" to-layer="9791" to-port="0" /> + <edge from-layer="9790" from-port="0" to-layer="9791" to-port="2" /> + <edge from-layer="9791" from-port="3" to-layer="9810" to-port="0" /> + <edge from-layer="9792" from-port="0" to-layer="9793" to-port="0" /> + <edge from-layer="9793" from-port="1" to-layer="9796" to-port="0" /> + <edge from-layer="9794" from-port="0" to-layer="9795" to-port="0" /> + <edge from-layer="9795" from-port="1" to-layer="9796" to-port="1" /> + <edge from-layer="9796" from-port="2" to-layer="9798" to-port="0" /> + <edge from-layer="9797" from-port="0" to-layer="9798" to-port="1" /> + <edge from-layer="9798" from-port="2" to-layer="9800" to-port="0" /> + <edge from-layer="9799" from-port="0" to-layer="9800" to-port="1" /> + <edge from-layer="9800" from-port="2" to-layer="9801" to-port="0" /> + <edge from-layer="9801" from-port="1" to-layer="9802" to-port="1" /> + <edge from-layer="9802" from-port="2" to-layer="9805" to-port="0" /> + <edge from-layer="9803" from-port="0" to-layer="9804" to-port="0" /> + <edge from-layer="9804" from-port="1" to-layer="9805" to-port="1" /> + <edge from-layer="9805" from-port="2" to-layer="9807" to-port="0" /> + <edge from-layer="9806" from-port="0" to-layer="9807" to-port="1" /> + <edge from-layer="9807" from-port="2" to-layer="9809" to-port="0" /> + <edge from-layer="9808" from-port="0" to-layer="9809" to-port="1" /> + <edge from-layer="9809" from-port="2" to-layer="9810" to-port="1" /> + <edge from-layer="9810" from-port="2" to-layer="9812" to-port="0" /> + <edge from-layer="9810" from-port="2" to-layer="9811" to-port="0" /> + <edge from-layer="9810" from-port="2" to-layer="11153" to-port="0" /> + <edge from-layer="9811" from-port="2" to-layer="9821" to-port="0" /> + <edge from-layer="9812" from-port="1" to-layer="9819" to-port="0" /> + <edge from-layer="9812" from-port="1" to-layer="9815" to-port="0" /> + <edge from-layer="9813" from-port="0" to-layer="9815" to-port="1" /> + <edge from-layer="9814" from-port="0" to-layer="9815" to-port="2" /> + <edge from-layer="9815" from-port="3" to-layer="9820" to-port="1" /> + <edge from-layer="9816" from-port="0" to-layer="9820" to-port="2" /> + <edge from-layer="9817" from-port="0" to-layer="9819" to-port="1" /> + <edge from-layer="9818" from-port="0" to-layer="9819" to-port="2" /> + <edge from-layer="9819" from-port="3" to-layer="9820" to-port="3" /> + <edge from-layer="9820" from-port="4" to-layer="9821" to-port="1" /> + <edge from-layer="9821" from-port="2" to-layer="9823" to-port="0" /> + <edge from-layer="9822" from-port="0" to-layer="9823" to-port="1" /> + <edge from-layer="9823" from-port="2" to-layer="9837" to-port="2" /> + <edge from-layer="9824" from-port="0" to-layer="9836" to-port="1" /> + <edge from-layer="9825" from-port="1" to-layer="9828" to-port="0" /> + <edge from-layer="9826" from-port="0" to-layer="9828" to-port="1" /> + <edge from-layer="9827" from-port="0" to-layer="9828" to-port="2" /> + <edge from-layer="9828" from-port="3" to-layer="9833" to-port="0" /> + <edge from-layer="9829" from-port="1" to-layer="9832" to-port="0" /> + <edge from-layer="9830" from-port="0" to-layer="9832" to-port="1" /> + <edge from-layer="9831" from-port="0" to-layer="9832" to-port="2" /> + <edge from-layer="9832" from-port="3" to-layer="9833" to-port="1" /> + <edge from-layer="9833" from-port="2" to-layer="9836" to-port="2" /> + <edge from-layer="9834" from-port="0" to-layer="9836" to-port="3" /> + <edge from-layer="9835" from-port="0" to-layer="9836" to-port="4" /> + <edge from-layer="9836" from-port="5" to-layer="9837" to-port="3" /> + <edge from-layer="9837" from-port="4" to-layer="9839" to-port="0" /> + <edge from-layer="9838" from-port="0" to-layer="9839" to-port="1" /> + <edge from-layer="9839" from-port="2" to-layer="9841" to-port="0" /> + <edge from-layer="9840" from-port="0" to-layer="9841" to-port="1" /> + <edge from-layer="9841" from-port="2" to-layer="9852" to-port="0" /> + <edge from-layer="9842" from-port="0" to-layer="9843" to-port="0" /> + <edge from-layer="9843" from-port="1" to-layer="9846" to-port="0" /> + <edge from-layer="9844" from-port="0" to-layer="9845" to-port="0" /> + <edge from-layer="9845" from-port="1" to-layer="9846" to-port="1" /> + <edge from-layer="9846" from-port="2" to-layer="9848" to-port="0" /> + <edge from-layer="9847" from-port="0" to-layer="9848" to-port="1" /> + <edge from-layer="9848" from-port="2" to-layer="9850" to-port="0" /> + <edge from-layer="9849" from-port="0" to-layer="9850" to-port="1" /> + <edge from-layer="9850" from-port="2" to-layer="9851" to-port="0" /> + <edge from-layer="9851" from-port="1" to-layer="9852" to-port="1" /> + <edge from-layer="9852" from-port="2" to-layer="9853" to-port="1" /> + <edge from-layer="9853" from-port="2" to-layer="9901" to-port="0" /> + <edge from-layer="9853" from-port="2" to-layer="9857" to-port="0" /> + <edge from-layer="9853" from-port="2" to-layer="9864" to-port="0" /> + <edge from-layer="9854" from-port="0" to-layer="9865" to-port="0" /> + <edge from-layer="9855" from-port="0" to-layer="9863" to-port="0" /> + <edge from-layer="9856" from-port="0" to-layer="9857" to-port="1" /> + <edge from-layer="9857" from-port="2" to-layer="9859" to-port="0" /> + <edge from-layer="9858" from-port="0" to-layer="9859" to-port="1" /> + <edge from-layer="9859" from-port="2" to-layer="9861" to-port="0" /> + <edge from-layer="9860" from-port="0" to-layer="9861" to-port="1" /> + <edge from-layer="9861" from-port="2" to-layer="9862" to-port="0" /> + <edge from-layer="9862" from-port="1" to-layer="9863" to-port="1" /> + <edge from-layer="9863" from-port="2" to-layer="9864" to-port="1" /> + <edge from-layer="9864" from-port="2" to-layer="9865" to-port="1" /> + <edge from-layer="9865" from-port="2" to-layer="9888" to-port="0" /> + <edge from-layer="9865" from-port="2" to-layer="9876" to-port="0" /> + <edge from-layer="9866" from-port="0" to-layer="9867" to-port="0" /> + <edge from-layer="9867" from-port="1" to-layer="9870" to-port="0" /> + <edge from-layer="9868" from-port="0" to-layer="9869" to-port="0" /> + <edge from-layer="9869" from-port="1" to-layer="9870" to-port="1" /> + <edge from-layer="9870" from-port="2" to-layer="9872" to-port="0" /> + <edge from-layer="9871" from-port="0" to-layer="9872" to-port="1" /> + <edge from-layer="9872" from-port="2" to-layer="9874" to-port="0" /> + <edge from-layer="9873" from-port="0" to-layer="9874" to-port="1" /> + <edge from-layer="9874" from-port="2" to-layer="9875" to-port="0" /> + <edge from-layer="9875" from-port="1" to-layer="9876" to-port="1" /> + <edge from-layer="9876" from-port="2" to-layer="9877" to-port="0" /> + <edge from-layer="9877" from-port="1" to-layer="9889" to-port="0" /> + <edge from-layer="9878" from-port="0" to-layer="9879" to-port="0" /> + <edge from-layer="9879" from-port="1" to-layer="9882" to-port="0" /> + <edge from-layer="9880" from-port="0" to-layer="9881" to-port="0" /> + <edge from-layer="9881" from-port="1" to-layer="9882" to-port="1" /> + <edge from-layer="9882" from-port="2" to-layer="9884" to-port="0" /> + <edge from-layer="9883" from-port="0" to-layer="9884" to-port="1" /> + <edge from-layer="9884" from-port="2" to-layer="9886" to-port="0" /> + <edge from-layer="9885" from-port="0" to-layer="9886" to-port="1" /> + <edge from-layer="9886" from-port="2" to-layer="9887" to-port="0" /> + <edge from-layer="9887" from-port="1" to-layer="9888" to-port="1" /> + <edge from-layer="9888" from-port="2" to-layer="9889" to-port="1" /> + <edge from-layer="9889" from-port="2" to-layer="9900" to-port="0" /> + <edge from-layer="9890" from-port="0" to-layer="9891" to-port="0" /> + <edge from-layer="9891" from-port="1" to-layer="9894" to-port="0" /> + <edge from-layer="9892" from-port="0" to-layer="9893" to-port="0" /> + <edge from-layer="9893" from-port="1" to-layer="9894" to-port="1" /> + <edge from-layer="9894" from-port="2" to-layer="9896" to-port="0" /> + <edge from-layer="9895" from-port="0" to-layer="9896" to-port="1" /> + <edge from-layer="9896" from-port="2" to-layer="9898" to-port="0" /> + <edge from-layer="9897" from-port="0" to-layer="9898" to-port="1" /> + <edge from-layer="9898" from-port="2" to-layer="9899" to-port="0" /> + <edge from-layer="9899" from-port="1" to-layer="9900" to-port="1" /> + <edge from-layer="9900" from-port="2" to-layer="9901" to-port="1" /> + <edge from-layer="9901" from-port="2" to-layer="10085" to-port="0" /> + <edge from-layer="9901" from-port="2" to-layer="9905" to-port="0" /> + <edge from-layer="9901" from-port="2" to-layer="9912" to-port="0" /> + <edge from-layer="9902" from-port="0" to-layer="9913" to-port="0" /> + <edge from-layer="9903" from-port="0" to-layer="9911" to-port="0" /> + <edge from-layer="9904" from-port="0" to-layer="9905" to-port="1" /> + <edge from-layer="9905" from-port="2" to-layer="9907" to-port="0" /> + <edge from-layer="9906" from-port="0" to-layer="9907" to-port="1" /> + <edge from-layer="9907" from-port="2" to-layer="9909" to-port="0" /> + <edge from-layer="9908" from-port="0" to-layer="9909" to-port="1" /> + <edge from-layer="9909" from-port="2" to-layer="9910" to-port="0" /> + <edge from-layer="9910" from-port="1" to-layer="9911" to-port="1" /> + <edge from-layer="9911" from-port="2" to-layer="9912" to-port="1" /> + <edge from-layer="9912" from-port="2" to-layer="9913" to-port="1" /> + <edge from-layer="9913" from-port="2" to-layer="9924" to-port="0" /> + <edge from-layer="9913" from-port="2" to-layer="9972" to-port="0" /> + <edge from-layer="9913" from-port="2" to-layer="10034" to-port="0" /> + <edge from-layer="9914" from-port="0" to-layer="9915" to-port="0" /> + <edge from-layer="9915" from-port="1" to-layer="9918" to-port="0" /> + <edge from-layer="9916" from-port="0" to-layer="9917" to-port="0" /> + <edge from-layer="9917" from-port="1" to-layer="9918" to-port="1" /> + <edge from-layer="9918" from-port="2" to-layer="9920" to-port="0" /> + <edge from-layer="9919" from-port="0" to-layer="9920" to-port="1" /> + <edge from-layer="9920" from-port="2" to-layer="9922" to-port="0" /> + <edge from-layer="9921" from-port="0" to-layer="9922" to-port="1" /> + <edge from-layer="9922" from-port="2" to-layer="9923" to-port="0" /> + <edge from-layer="9923" from-port="1" to-layer="9924" to-port="1" /> + <edge from-layer="9924" from-port="2" to-layer="9927" to-port="0" /> + <edge from-layer="9925" from-port="0" to-layer="9926" to-port="0" /> + <edge from-layer="9926" from-port="1" to-layer="9927" to-port="1" /> + <edge from-layer="9927" from-port="2" to-layer="9929" to-port="0" /> + <edge from-layer="9928" from-port="0" to-layer="9929" to-port="1" /> + <edge from-layer="9929" from-port="2" to-layer="9931" to-port="0" /> + <edge from-layer="9930" from-port="0" to-layer="9931" to-port="1" /> + <edge from-layer="9931" from-port="2" to-layer="9949" to-port="0" /> + <edge from-layer="9931" from-port="2" to-layer="9932" to-port="0" /> + <edge from-layer="9931" from-port="2" to-layer="9933" to-port="0" /> + <edge from-layer="9931" from-port="2" to-layer="9943" to-port="0" /> + <edge from-layer="9932" from-port="2" to-layer="9952" to-port="0" /> + <edge from-layer="9933" from-port="1" to-layer="9935" to-port="0" /> + <edge from-layer="9934" from-port="0" to-layer="9935" to-port="2" /> + <edge from-layer="9935" from-port="3" to-layer="9936" to-port="0" /> + <edge from-layer="9936" from-port="2" to-layer="9937" to-port="0" /> + <edge from-layer="9937" from-port="1" to-layer="9939" to-port="0" /> + <edge from-layer="9938" from-port="0" to-layer="9939" to-port="1" /> + <edge from-layer="9939" from-port="2" to-layer="9943" to-port="1" /> + <edge from-layer="9939" from-port="2" to-layer="9949" to-port="2" /> + <edge from-layer="9940" from-port="0" to-layer="9943" to-port="2" /> + <edge from-layer="9941" from-port="0" to-layer="9943" to-port="3" /> + <edge from-layer="9942" from-port="0" to-layer="9943" to-port="4" /> + <edge from-layer="9943" from-port="5" to-layer="9945" to-port="0" /> + <edge from-layer="9944" from-port="0" to-layer="9945" to-port="1" /> + <edge from-layer="9945" from-port="2" to-layer="9950" to-port="0" /> + <edge from-layer="9946" from-port="0" to-layer="9949" to-port="1" /> + <edge from-layer="9947" from-port="0" to-layer="9949" to-port="3" /> + <edge from-layer="9948" from-port="0" to-layer="9949" to-port="4" /> + <edge from-layer="9949" from-port="5" to-layer="9950" to-port="1" /> + <edge from-layer="9950" from-port="2" to-layer="9951" to-port="0" /> + <edge from-layer="9951" from-port="2" to-layer="9952" to-port="1" /> + <edge from-layer="9952" from-port="2" to-layer="10069" to-port="0" /> + <edge from-layer="9953" from-port="0" to-layer="9958" to-port="0" /> + <edge from-layer="9954" from-port="0" to-layer="9957" to-port="1" /> + <edge from-layer="9955" from-port="0" to-layer="9957" to-port="2" /> + <edge from-layer="9956" from-port="0" to-layer="9957" to-port="3" /> + <edge from-layer="9957" from-port="4" to-layer="9958" to-port="1" /> + <edge from-layer="9958" from-port="2" to-layer="9959" to-port="0" /> + <edge from-layer="9959" from-port="1" to-layer="9961" to-port="0" /> + <edge from-layer="9960" from-port="0" to-layer="9961" to-port="2" /> + <edge from-layer="9961" from-port="3" to-layer="10001" to-port="0" /> + <edge from-layer="9961" from-port="3" to-layer="10057" to-port="0" /> + <edge from-layer="9962" from-port="0" to-layer="9963" to-port="0" /> + <edge from-layer="9963" from-port="1" to-layer="9966" to-port="0" /> + <edge from-layer="9964" from-port="0" to-layer="9965" to-port="0" /> + <edge from-layer="9965" from-port="1" to-layer="9966" to-port="1" /> + <edge from-layer="9966" from-port="2" to-layer="9968" to-port="0" /> + <edge from-layer="9967" from-port="0" to-layer="9968" to-port="1" /> + <edge from-layer="9968" from-port="2" to-layer="9970" to-port="0" /> + <edge from-layer="9969" from-port="0" to-layer="9970" to-port="1" /> + <edge from-layer="9970" from-port="2" to-layer="9971" to-port="0" /> + <edge from-layer="9971" from-port="1" to-layer="9972" to-port="1" /> + <edge from-layer="9972" from-port="2" to-layer="9975" to-port="0" /> + <edge from-layer="9973" from-port="0" to-layer="9974" to-port="0" /> + <edge from-layer="9974" from-port="1" to-layer="9975" to-port="1" /> + <edge from-layer="9975" from-port="2" to-layer="9977" to-port="0" /> + <edge from-layer="9976" from-port="0" to-layer="9977" to-port="1" /> + <edge from-layer="9977" from-port="2" to-layer="9979" to-port="0" /> + <edge from-layer="9978" from-port="0" to-layer="9979" to-port="1" /> + <edge from-layer="9979" from-port="2" to-layer="9997" to-port="0" /> + <edge from-layer="9979" from-port="2" to-layer="9991" to-port="0" /> + <edge from-layer="9979" from-port="2" to-layer="9980" to-port="0" /> + <edge from-layer="9979" from-port="2" to-layer="9981" to-port="0" /> + <edge from-layer="9980" from-port="2" to-layer="10000" to-port="0" /> + <edge from-layer="9981" from-port="1" to-layer="9983" to-port="0" /> + <edge from-layer="9982" from-port="0" to-layer="9983" to-port="2" /> + <edge from-layer="9983" from-port="3" to-layer="9984" to-port="0" /> + <edge from-layer="9984" from-port="2" to-layer="9985" to-port="0" /> + <edge from-layer="9985" from-port="1" to-layer="9987" to-port="0" /> + <edge from-layer="9986" from-port="0" to-layer="9987" to-port="1" /> + <edge from-layer="9987" from-port="2" to-layer="9991" to-port="1" /> + <edge from-layer="9987" from-port="2" to-layer="9997" to-port="2" /> + <edge from-layer="9988" from-port="0" to-layer="9991" to-port="2" /> + <edge from-layer="9989" from-port="0" to-layer="9991" to-port="3" /> + <edge from-layer="9990" from-port="0" to-layer="9991" to-port="4" /> + <edge from-layer="9991" from-port="5" to-layer="9993" to-port="0" /> + <edge from-layer="9992" from-port="0" to-layer="9993" to-port="1" /> + <edge from-layer="9993" from-port="2" to-layer="9998" to-port="0" /> + <edge from-layer="9994" from-port="0" to-layer="9997" to-port="1" /> + <edge from-layer="9995" from-port="0" to-layer="9997" to-port="3" /> + <edge from-layer="9996" from-port="0" to-layer="9997" to-port="4" /> + <edge from-layer="9997" from-port="5" to-layer="9998" to-port="1" /> + <edge from-layer="9998" from-port="2" to-layer="9999" to-port="0" /> + <edge from-layer="9999" from-port="2" to-layer="10000" to-port="1" /> + <edge from-layer="10000" from-port="2" to-layer="10061" to-port="0" /> + <edge from-layer="10000" from-port="2" to-layer="10001" to-port="1" /> + <edge from-layer="10001" from-port="2" to-layer="11152" to-port="0" /> + <edge from-layer="10001" from-port="2" to-layer="10002" to-port="0" /> + <edge from-layer="10001" from-port="2" to-layer="10003" to-port="0" /> + <edge from-layer="10002" from-port="2" to-layer="10012" to-port="0" /> + <edge from-layer="10003" from-port="1" to-layer="10006" to-port="0" /> + <edge from-layer="10003" from-port="1" to-layer="10010" to-port="0" /> + <edge from-layer="10004" from-port="0" to-layer="10006" to-port="1" /> + <edge from-layer="10005" from-port="0" to-layer="10006" to-port="2" /> + <edge from-layer="10006" from-port="3" to-layer="10011" to-port="0" /> + <edge from-layer="10007" from-port="0" to-layer="10011" to-port="1" /> + <edge from-layer="10008" from-port="0" to-layer="10010" to-port="1" /> + <edge from-layer="10009" from-port="0" to-layer="10010" to-port="2" /> + <edge from-layer="10010" from-port="3" to-layer="10011" to-port="2" /> + <edge from-layer="10011" from-port="3" to-layer="10012" to-port="1" /> + <edge from-layer="10012" from-port="2" to-layer="10014" to-port="0" /> + <edge from-layer="10013" from-port="0" to-layer="10014" to-port="1" /> + <edge from-layer="10014" from-port="2" to-layer="10069" to-port="1" /> + <edge from-layer="10015" from-port="0" to-layer="10020" to-port="0" /> + <edge from-layer="10016" from-port="0" to-layer="10019" to-port="1" /> + <edge from-layer="10017" from-port="0" to-layer="10019" to-port="2" /> + <edge from-layer="10018" from-port="0" to-layer="10019" to-port="3" /> + <edge from-layer="10019" from-port="4" to-layer="10020" to-port="1" /> + <edge from-layer="10020" from-port="2" to-layer="10021" to-port="0" /> + <edge from-layer="10021" from-port="1" to-layer="10023" to-port="0" /> + <edge from-layer="10022" from-port="0" to-layer="10023" to-port="2" /> + <edge from-layer="10023" from-port="3" to-layer="10042" to-port="0" /> + <edge from-layer="10024" from-port="0" to-layer="10025" to-port="0" /> + <edge from-layer="10025" from-port="1" to-layer="10028" to-port="0" /> + <edge from-layer="10026" from-port="0" to-layer="10027" to-port="0" /> + <edge from-layer="10027" from-port="1" to-layer="10028" to-port="1" /> + <edge from-layer="10028" from-port="2" to-layer="10030" to-port="0" /> + <edge from-layer="10029" from-port="0" to-layer="10030" to-port="1" /> + <edge from-layer="10030" from-port="2" to-layer="10032" to-port="0" /> + <edge from-layer="10031" from-port="0" to-layer="10032" to-port="1" /> + <edge from-layer="10032" from-port="2" to-layer="10033" to-port="0" /> + <edge from-layer="10033" from-port="1" to-layer="10034" to-port="1" /> + <edge from-layer="10034" from-port="2" to-layer="10037" to-port="0" /> + <edge from-layer="10035" from-port="0" to-layer="10036" to-port="0" /> + <edge from-layer="10036" from-port="1" to-layer="10037" to-port="1" /> + <edge from-layer="10037" from-port="2" to-layer="10039" to-port="0" /> + <edge from-layer="10038" from-port="0" to-layer="10039" to-port="1" /> + <edge from-layer="10039" from-port="2" to-layer="10041" to-port="0" /> + <edge from-layer="10040" from-port="0" to-layer="10041" to-port="1" /> + <edge from-layer="10041" from-port="2" to-layer="10042" to-port="1" /> + <edge from-layer="10042" from-port="2" to-layer="11151" to-port="0" /> + <edge from-layer="10042" from-port="2" to-layer="10043" to-port="0" /> + <edge from-layer="10042" from-port="2" to-layer="10044" to-port="0" /> + <edge from-layer="10043" from-port="2" to-layer="10053" to-port="0" /> + <edge from-layer="10044" from-port="1" to-layer="10047" to-port="0" /> + <edge from-layer="10044" from-port="1" to-layer="10051" to-port="0" /> + <edge from-layer="10045" from-port="0" to-layer="10047" to-port="1" /> + <edge from-layer="10046" from-port="0" to-layer="10047" to-port="2" /> + <edge from-layer="10047" from-port="3" to-layer="10052" to-port="1" /> + <edge from-layer="10048" from-port="0" to-layer="10052" to-port="2" /> + <edge from-layer="10049" from-port="0" to-layer="10051" to-port="1" /> + <edge from-layer="10050" from-port="0" to-layer="10051" to-port="2" /> + <edge from-layer="10051" from-port="3" to-layer="10052" to-port="3" /> + <edge from-layer="10052" from-port="4" to-layer="10053" to-port="1" /> + <edge from-layer="10053" from-port="2" to-layer="10055" to-port="0" /> + <edge from-layer="10054" from-port="0" to-layer="10055" to-port="1" /> + <edge from-layer="10055" from-port="2" to-layer="10069" to-port="2" /> + <edge from-layer="10056" from-port="0" to-layer="10068" to-port="1" /> + <edge from-layer="10057" from-port="1" to-layer="10060" to-port="0" /> + <edge from-layer="10058" from-port="0" to-layer="10060" to-port="1" /> + <edge from-layer="10059" from-port="0" to-layer="10060" to-port="2" /> + <edge from-layer="10060" from-port="3" to-layer="10065" to-port="0" /> + <edge from-layer="10061" from-port="1" to-layer="10064" to-port="0" /> + <edge from-layer="10062" from-port="0" to-layer="10064" to-port="1" /> + <edge from-layer="10063" from-port="0" to-layer="10064" to-port="2" /> + <edge from-layer="10064" from-port="3" to-layer="10065" to-port="1" /> + <edge from-layer="10065" from-port="2" to-layer="10068" to-port="2" /> + <edge from-layer="10066" from-port="0" to-layer="10068" to-port="3" /> + <edge from-layer="10067" from-port="0" to-layer="10068" to-port="4" /> + <edge from-layer="10068" from-port="5" to-layer="10069" to-port="3" /> + <edge from-layer="10069" from-port="4" to-layer="10071" to-port="0" /> + <edge from-layer="10070" from-port="0" to-layer="10071" to-port="1" /> + <edge from-layer="10071" from-port="2" to-layer="10073" to-port="0" /> + <edge from-layer="10072" from-port="0" to-layer="10073" to-port="1" /> + <edge from-layer="10073" from-port="2" to-layer="10084" to-port="0" /> + <edge from-layer="10074" from-port="0" to-layer="10075" to-port="0" /> + <edge from-layer="10075" from-port="1" to-layer="10078" to-port="0" /> + <edge from-layer="10076" from-port="0" to-layer="10077" to-port="0" /> + <edge from-layer="10077" from-port="1" to-layer="10078" to-port="1" /> + <edge from-layer="10078" from-port="2" to-layer="10080" to-port="0" /> + <edge from-layer="10079" from-port="0" to-layer="10080" to-port="1" /> + <edge from-layer="10080" from-port="2" to-layer="10082" to-port="0" /> + <edge from-layer="10081" from-port="0" to-layer="10082" to-port="1" /> + <edge from-layer="10082" from-port="2" to-layer="10083" to-port="0" /> + <edge from-layer="10083" from-port="1" to-layer="10084" to-port="1" /> + <edge from-layer="10084" from-port="2" to-layer="10085" to-port="1" /> + <edge from-layer="10085" from-port="2" to-layer="10133" to-port="0" /> + <edge from-layer="10085" from-port="2" to-layer="10089" to-port="0" /> + <edge from-layer="10085" from-port="2" to-layer="10096" to-port="0" /> + <edge from-layer="10086" from-port="0" to-layer="10097" to-port="0" /> + <edge from-layer="10087" from-port="0" to-layer="10095" to-port="0" /> + <edge from-layer="10088" from-port="0" to-layer="10089" to-port="1" /> + <edge from-layer="10089" from-port="2" to-layer="10091" to-port="0" /> + <edge from-layer="10090" from-port="0" to-layer="10091" to-port="1" /> + <edge from-layer="10091" from-port="2" to-layer="10093" to-port="0" /> + <edge from-layer="10092" from-port="0" to-layer="10093" to-port="1" /> + <edge from-layer="10093" from-port="2" to-layer="10094" to-port="0" /> + <edge from-layer="10094" from-port="1" to-layer="10095" to-port="1" /> + <edge from-layer="10095" from-port="2" to-layer="10096" to-port="1" /> + <edge from-layer="10096" from-port="2" to-layer="10097" to-port="1" /> + <edge from-layer="10097" from-port="2" to-layer="10120" to-port="0" /> + <edge from-layer="10097" from-port="2" to-layer="10108" to-port="0" /> + <edge from-layer="10098" from-port="0" to-layer="10099" to-port="0" /> + <edge from-layer="10099" from-port="1" to-layer="10102" to-port="0" /> + <edge from-layer="10100" from-port="0" to-layer="10101" to-port="0" /> + <edge from-layer="10101" from-port="1" to-layer="10102" to-port="1" /> + <edge from-layer="10102" from-port="2" to-layer="10104" to-port="0" /> + <edge from-layer="10103" from-port="0" to-layer="10104" to-port="1" /> + <edge from-layer="10104" from-port="2" to-layer="10106" to-port="0" /> + <edge from-layer="10105" from-port="0" to-layer="10106" to-port="1" /> + <edge from-layer="10106" from-port="2" to-layer="10107" to-port="0" /> + <edge from-layer="10107" from-port="1" to-layer="10108" to-port="1" /> + <edge from-layer="10108" from-port="2" to-layer="10109" to-port="0" /> + <edge from-layer="10109" from-port="1" to-layer="10121" to-port="0" /> + <edge from-layer="10110" from-port="0" to-layer="10111" to-port="0" /> + <edge from-layer="10111" from-port="1" to-layer="10114" to-port="0" /> + <edge from-layer="10112" from-port="0" to-layer="10113" to-port="0" /> + <edge from-layer="10113" from-port="1" to-layer="10114" to-port="1" /> + <edge from-layer="10114" from-port="2" to-layer="10116" to-port="0" /> + <edge from-layer="10115" from-port="0" to-layer="10116" to-port="1" /> + <edge from-layer="10116" from-port="2" to-layer="10118" to-port="0" /> + <edge from-layer="10117" from-port="0" to-layer="10118" to-port="1" /> + <edge from-layer="10118" from-port="2" to-layer="10119" to-port="0" /> + <edge from-layer="10119" from-port="1" to-layer="10120" to-port="1" /> + <edge from-layer="10120" from-port="2" to-layer="10121" to-port="1" /> + <edge from-layer="10121" from-port="2" to-layer="10132" to-port="0" /> + <edge from-layer="10122" from-port="0" to-layer="10123" to-port="0" /> + <edge from-layer="10123" from-port="1" to-layer="10126" to-port="0" /> + <edge from-layer="10124" from-port="0" to-layer="10125" to-port="0" /> + <edge from-layer="10125" from-port="1" to-layer="10126" to-port="1" /> + <edge from-layer="10126" from-port="2" to-layer="10128" to-port="0" /> + <edge from-layer="10127" from-port="0" to-layer="10128" to-port="1" /> + <edge from-layer="10128" from-port="2" to-layer="10130" to-port="0" /> + <edge from-layer="10129" from-port="0" to-layer="10130" to-port="1" /> + <edge from-layer="10130" from-port="2" to-layer="10131" to-port="0" /> + <edge from-layer="10131" from-port="1" to-layer="10132" to-port="1" /> + <edge from-layer="10132" from-port="2" to-layer="10133" to-port="1" /> + <edge from-layer="10133" from-port="2" to-layer="10317" to-port="0" /> + <edge from-layer="10133" from-port="2" to-layer="10144" to-port="0" /> + <edge from-layer="10133" from-port="2" to-layer="10137" to-port="0" /> + <edge from-layer="10134" from-port="0" to-layer="10145" to-port="0" /> + <edge from-layer="10135" from-port="0" to-layer="10143" to-port="0" /> + <edge from-layer="10136" from-port="0" to-layer="10137" to-port="1" /> + <edge from-layer="10137" from-port="2" to-layer="10139" to-port="0" /> + <edge from-layer="10138" from-port="0" to-layer="10139" to-port="1" /> + <edge from-layer="10139" from-port="2" to-layer="10141" to-port="0" /> + <edge from-layer="10140" from-port="0" to-layer="10141" to-port="1" /> + <edge from-layer="10141" from-port="2" to-layer="10142" to-port="0" /> + <edge from-layer="10142" from-port="1" to-layer="10143" to-port="1" /> + <edge from-layer="10143" from-port="2" to-layer="10144" to-port="1" /> + <edge from-layer="10144" from-port="2" to-layer="10145" to-port="1" /> + <edge from-layer="10145" from-port="2" to-layer="10156" to-port="0" /> + <edge from-layer="10145" from-port="2" to-layer="10266" to-port="0" /> + <edge from-layer="10145" from-port="2" to-layer="10204" to-port="0" /> + <edge from-layer="10146" from-port="0" to-layer="10147" to-port="0" /> + <edge from-layer="10147" from-port="1" to-layer="10150" to-port="0" /> + <edge from-layer="10148" from-port="0" to-layer="10149" to-port="0" /> + <edge from-layer="10149" from-port="1" to-layer="10150" to-port="1" /> + <edge from-layer="10150" from-port="2" to-layer="10152" to-port="0" /> + <edge from-layer="10151" from-port="0" to-layer="10152" to-port="1" /> + <edge from-layer="10152" from-port="2" to-layer="10154" to-port="0" /> + <edge from-layer="10153" from-port="0" to-layer="10154" to-port="1" /> + <edge from-layer="10154" from-port="2" to-layer="10155" to-port="0" /> + <edge from-layer="10155" from-port="1" to-layer="10156" to-port="1" /> + <edge from-layer="10156" from-port="2" to-layer="10159" to-port="0" /> + <edge from-layer="10157" from-port="0" to-layer="10158" to-port="0" /> + <edge from-layer="10158" from-port="1" to-layer="10159" to-port="1" /> + <edge from-layer="10159" from-port="2" to-layer="10161" to-port="0" /> + <edge from-layer="10160" from-port="0" to-layer="10161" to-port="1" /> + <edge from-layer="10161" from-port="2" to-layer="10163" to-port="0" /> + <edge from-layer="10162" from-port="0" to-layer="10163" to-port="1" /> + <edge from-layer="10163" from-port="2" to-layer="10181" to-port="0" /> + <edge from-layer="10163" from-port="2" to-layer="10175" to-port="0" /> + <edge from-layer="10163" from-port="2" to-layer="10165" to-port="0" /> + <edge from-layer="10163" from-port="2" to-layer="10164" to-port="0" /> + <edge from-layer="10164" from-port="2" to-layer="10184" to-port="0" /> + <edge from-layer="10165" from-port="1" to-layer="10167" to-port="0" /> + <edge from-layer="10166" from-port="0" to-layer="10167" to-port="2" /> + <edge from-layer="10167" from-port="3" to-layer="10168" to-port="0" /> + <edge from-layer="10168" from-port="2" to-layer="10169" to-port="0" /> + <edge from-layer="10169" from-port="1" to-layer="10171" to-port="0" /> + <edge from-layer="10170" from-port="0" to-layer="10171" to-port="1" /> + <edge from-layer="10171" from-port="2" to-layer="10181" to-port="2" /> + <edge from-layer="10171" from-port="2" to-layer="10175" to-port="1" /> + <edge from-layer="10172" from-port="0" to-layer="10175" to-port="2" /> + <edge from-layer="10173" from-port="0" to-layer="10175" to-port="3" /> + <edge from-layer="10174" from-port="0" to-layer="10175" to-port="4" /> + <edge from-layer="10175" from-port="5" to-layer="10177" to-port="0" /> + <edge from-layer="10176" from-port="0" to-layer="10177" to-port="1" /> + <edge from-layer="10177" from-port="2" to-layer="10182" to-port="0" /> + <edge from-layer="10178" from-port="0" to-layer="10181" to-port="1" /> + <edge from-layer="10179" from-port="0" to-layer="10181" to-port="3" /> + <edge from-layer="10180" from-port="0" to-layer="10181" to-port="4" /> + <edge from-layer="10181" from-port="5" to-layer="10182" to-port="1" /> + <edge from-layer="10182" from-port="2" to-layer="10183" to-port="0" /> + <edge from-layer="10183" from-port="2" to-layer="10184" to-port="1" /> + <edge from-layer="10184" from-port="2" to-layer="10301" to-port="0" /> + <edge from-layer="10185" from-port="0" to-layer="10190" to-port="0" /> + <edge from-layer="10186" from-port="0" to-layer="10189" to-port="1" /> + <edge from-layer="10187" from-port="0" to-layer="10189" to-port="2" /> + <edge from-layer="10188" from-port="0" to-layer="10189" to-port="3" /> + <edge from-layer="10189" from-port="4" to-layer="10190" to-port="1" /> + <edge from-layer="10190" from-port="2" to-layer="10191" to-port="0" /> + <edge from-layer="10191" from-port="1" to-layer="10193" to-port="0" /> + <edge from-layer="10192" from-port="0" to-layer="10193" to-port="2" /> + <edge from-layer="10193" from-port="3" to-layer="10289" to-port="0" /> + <edge from-layer="10193" from-port="3" to-layer="10233" to-port="0" /> + <edge from-layer="10194" from-port="0" to-layer="10195" to-port="0" /> + <edge from-layer="10195" from-port="1" to-layer="10198" to-port="0" /> + <edge from-layer="10196" from-port="0" to-layer="10197" to-port="0" /> + <edge from-layer="10197" from-port="1" to-layer="10198" to-port="1" /> + <edge from-layer="10198" from-port="2" to-layer="10200" to-port="0" /> + <edge from-layer="10199" from-port="0" to-layer="10200" to-port="1" /> + <edge from-layer="10200" from-port="2" to-layer="10202" to-port="0" /> + <edge from-layer="10201" from-port="0" to-layer="10202" to-port="1" /> + <edge from-layer="10202" from-port="2" to-layer="10203" to-port="0" /> + <edge from-layer="10203" from-port="1" to-layer="10204" to-port="1" /> + <edge from-layer="10204" from-port="2" to-layer="10207" to-port="0" /> + <edge from-layer="10205" from-port="0" to-layer="10206" to-port="0" /> + <edge from-layer="10206" from-port="1" to-layer="10207" to-port="1" /> + <edge from-layer="10207" from-port="2" to-layer="10209" to-port="0" /> + <edge from-layer="10208" from-port="0" to-layer="10209" to-port="1" /> + <edge from-layer="10209" from-port="2" to-layer="10211" to-port="0" /> + <edge from-layer="10210" from-port="0" to-layer="10211" to-port="1" /> + <edge from-layer="10211" from-port="2" to-layer="10212" to-port="0" /> + <edge from-layer="10211" from-port="2" to-layer="10213" to-port="0" /> + <edge from-layer="10211" from-port="2" to-layer="10223" to-port="0" /> + <edge from-layer="10211" from-port="2" to-layer="10229" to-port="0" /> + <edge from-layer="10212" from-port="2" to-layer="10232" to-port="0" /> + <edge from-layer="10213" from-port="1" to-layer="10215" to-port="0" /> + <edge from-layer="10214" from-port="0" to-layer="10215" to-port="2" /> + <edge from-layer="10215" from-port="3" to-layer="10216" to-port="0" /> + <edge from-layer="10216" from-port="2" to-layer="10217" to-port="0" /> + <edge from-layer="10217" from-port="1" to-layer="10219" to-port="0" /> + <edge from-layer="10218" from-port="0" to-layer="10219" to-port="1" /> + <edge from-layer="10219" from-port="2" to-layer="10229" to-port="2" /> + <edge from-layer="10219" from-port="2" to-layer="10223" to-port="1" /> + <edge from-layer="10220" from-port="0" to-layer="10223" to-port="2" /> + <edge from-layer="10221" from-port="0" to-layer="10223" to-port="3" /> + <edge from-layer="10222" from-port="0" to-layer="10223" to-port="4" /> + <edge from-layer="10223" from-port="5" to-layer="10225" to-port="0" /> + <edge from-layer="10224" from-port="0" to-layer="10225" to-port="1" /> + <edge from-layer="10225" from-port="2" to-layer="10230" to-port="0" /> + <edge from-layer="10226" from-port="0" to-layer="10229" to-port="1" /> + <edge from-layer="10227" from-port="0" to-layer="10229" to-port="3" /> + <edge from-layer="10228" from-port="0" to-layer="10229" to-port="4" /> + <edge from-layer="10229" from-port="5" to-layer="10230" to-port="1" /> + <edge from-layer="10230" from-port="2" to-layer="10231" to-port="0" /> + <edge from-layer="10231" from-port="2" to-layer="10232" to-port="1" /> + <edge from-layer="10232" from-port="2" to-layer="10233" to-port="1" /> + <edge from-layer="10232" from-port="2" to-layer="10293" to-port="0" /> + <edge from-layer="10233" from-port="2" to-layer="10234" to-port="0" /> + <edge from-layer="10233" from-port="2" to-layer="11150" to-port="0" /> + <edge from-layer="10233" from-port="2" to-layer="10235" to-port="0" /> + <edge from-layer="10234" from-port="2" to-layer="10244" to-port="0" /> + <edge from-layer="10235" from-port="1" to-layer="10238" to-port="0" /> + <edge from-layer="10235" from-port="1" to-layer="10242" to-port="0" /> + <edge from-layer="10236" from-port="0" to-layer="10238" to-port="1" /> + <edge from-layer="10237" from-port="0" to-layer="10238" to-port="2" /> + <edge from-layer="10238" from-port="3" to-layer="10243" to-port="0" /> + <edge from-layer="10239" from-port="0" to-layer="10243" to-port="1" /> + <edge from-layer="10240" from-port="0" to-layer="10242" to-port="1" /> + <edge from-layer="10241" from-port="0" to-layer="10242" to-port="2" /> + <edge from-layer="10242" from-port="3" to-layer="10243" to-port="2" /> + <edge from-layer="10243" from-port="3" to-layer="10244" to-port="1" /> + <edge from-layer="10244" from-port="2" to-layer="10246" to-port="0" /> + <edge from-layer="10245" from-port="0" to-layer="10246" to-port="1" /> + <edge from-layer="10246" from-port="2" to-layer="10301" to-port="1" /> + <edge from-layer="10247" from-port="0" to-layer="10252" to-port="0" /> + <edge from-layer="10248" from-port="0" to-layer="10251" to-port="1" /> + <edge from-layer="10249" from-port="0" to-layer="10251" to-port="2" /> + <edge from-layer="10250" from-port="0" to-layer="10251" to-port="3" /> + <edge from-layer="10251" from-port="4" to-layer="10252" to-port="1" /> + <edge from-layer="10252" from-port="2" to-layer="10253" to-port="0" /> + <edge from-layer="10253" from-port="1" to-layer="10255" to-port="0" /> + <edge from-layer="10254" from-port="0" to-layer="10255" to-port="2" /> + <edge from-layer="10255" from-port="3" to-layer="10274" to-port="0" /> + <edge from-layer="10256" from-port="0" to-layer="10257" to-port="0" /> + <edge from-layer="10257" from-port="1" to-layer="10260" to-port="0" /> + <edge from-layer="10258" from-port="0" to-layer="10259" to-port="0" /> + <edge from-layer="10259" from-port="1" to-layer="10260" to-port="1" /> + <edge from-layer="10260" from-port="2" to-layer="10262" to-port="0" /> + <edge from-layer="10261" from-port="0" to-layer="10262" to-port="1" /> + <edge from-layer="10262" from-port="2" to-layer="10264" to-port="0" /> + <edge from-layer="10263" from-port="0" to-layer="10264" to-port="1" /> + <edge from-layer="10264" from-port="2" to-layer="10265" to-port="0" /> + <edge from-layer="10265" from-port="1" to-layer="10266" to-port="1" /> + <edge from-layer="10266" from-port="2" to-layer="10269" to-port="0" /> + <edge from-layer="10267" from-port="0" to-layer="10268" to-port="0" /> + <edge from-layer="10268" from-port="1" to-layer="10269" to-port="1" /> + <edge from-layer="10269" from-port="2" to-layer="10271" to-port="0" /> + <edge from-layer="10270" from-port="0" to-layer="10271" to-port="1" /> + <edge from-layer="10271" from-port="2" to-layer="10273" to-port="0" /> + <edge from-layer="10272" from-port="0" to-layer="10273" to-port="1" /> + <edge from-layer="10273" from-port="2" to-layer="10274" to-port="1" /> + <edge from-layer="10274" from-port="2" to-layer="10276" to-port="0" /> + <edge from-layer="10274" from-port="2" to-layer="10275" to-port="0" /> + <edge from-layer="10274" from-port="2" to-layer="11149" to-port="0" /> + <edge from-layer="10275" from-port="2" to-layer="10285" to-port="0" /> + <edge from-layer="10276" from-port="1" to-layer="10283" to-port="0" /> + <edge from-layer="10276" from-port="1" to-layer="10279" to-port="0" /> + <edge from-layer="10277" from-port="0" to-layer="10279" to-port="1" /> + <edge from-layer="10278" from-port="0" to-layer="10279" to-port="2" /> + <edge from-layer="10279" from-port="3" to-layer="10284" to-port="1" /> + <edge from-layer="10280" from-port="0" to-layer="10284" to-port="2" /> + <edge from-layer="10281" from-port="0" to-layer="10283" to-port="1" /> + <edge from-layer="10282" from-port="0" to-layer="10283" to-port="2" /> + <edge from-layer="10283" from-port="3" to-layer="10284" to-port="3" /> + <edge from-layer="10284" from-port="4" to-layer="10285" to-port="1" /> + <edge from-layer="10285" from-port="2" to-layer="10287" to-port="0" /> + <edge from-layer="10286" from-port="0" to-layer="10287" to-port="1" /> + <edge from-layer="10287" from-port="2" to-layer="10301" to-port="2" /> + <edge from-layer="10288" from-port="0" to-layer="10300" to-port="1" /> + <edge from-layer="10289" from-port="1" to-layer="10292" to-port="0" /> + <edge from-layer="10290" from-port="0" to-layer="10292" to-port="1" /> + <edge from-layer="10291" from-port="0" to-layer="10292" to-port="2" /> + <edge from-layer="10292" from-port="3" to-layer="10297" to-port="0" /> + <edge from-layer="10293" from-port="1" to-layer="10296" to-port="0" /> + <edge from-layer="10294" from-port="0" to-layer="10296" to-port="1" /> + <edge from-layer="10295" from-port="0" to-layer="10296" to-port="2" /> + <edge from-layer="10296" from-port="3" to-layer="10297" to-port="1" /> + <edge from-layer="10297" from-port="2" to-layer="10300" to-port="2" /> + <edge from-layer="10298" from-port="0" to-layer="10300" to-port="3" /> + <edge from-layer="10299" from-port="0" to-layer="10300" to-port="4" /> + <edge from-layer="10300" from-port="5" to-layer="10301" to-port="3" /> + <edge from-layer="10301" from-port="4" to-layer="10303" to-port="0" /> + <edge from-layer="10302" from-port="0" to-layer="10303" to-port="1" /> + <edge from-layer="10303" from-port="2" to-layer="10305" to-port="0" /> + <edge from-layer="10304" from-port="0" to-layer="10305" to-port="1" /> + <edge from-layer="10305" from-port="2" to-layer="10316" to-port="0" /> + <edge from-layer="10306" from-port="0" to-layer="10307" to-port="0" /> + <edge from-layer="10307" from-port="1" to-layer="10310" to-port="0" /> + <edge from-layer="10308" from-port="0" to-layer="10309" to-port="0" /> + <edge from-layer="10309" from-port="1" to-layer="10310" to-port="1" /> + <edge from-layer="10310" from-port="2" to-layer="10312" to-port="0" /> + <edge from-layer="10311" from-port="0" to-layer="10312" to-port="1" /> + <edge from-layer="10312" from-port="2" to-layer="10314" to-port="0" /> + <edge from-layer="10313" from-port="0" to-layer="10314" to-port="1" /> + <edge from-layer="10314" from-port="2" to-layer="10315" to-port="0" /> + <edge from-layer="10315" from-port="1" to-layer="10316" to-port="1" /> + <edge from-layer="10316" from-port="2" to-layer="10317" to-port="1" /> + <edge from-layer="10317" from-port="2" to-layer="10321" to-port="0" /> + <edge from-layer="10317" from-port="2" to-layer="10365" to-port="0" /> + <edge from-layer="10317" from-port="2" to-layer="10328" to-port="0" /> + <edge from-layer="10318" from-port="0" to-layer="10329" to-port="0" /> + <edge from-layer="10319" from-port="0" to-layer="10327" to-port="0" /> + <edge from-layer="10320" from-port="0" to-layer="10321" to-port="1" /> + <edge from-layer="10321" from-port="2" to-layer="10323" to-port="0" /> + <edge from-layer="10322" from-port="0" to-layer="10323" to-port="1" /> + <edge from-layer="10323" from-port="2" to-layer="10325" to-port="0" /> + <edge from-layer="10324" from-port="0" to-layer="10325" to-port="1" /> + <edge from-layer="10325" from-port="2" to-layer="10326" to-port="0" /> + <edge from-layer="10326" from-port="1" to-layer="10327" to-port="1" /> + <edge from-layer="10327" from-port="2" to-layer="10328" to-port="1" /> + <edge from-layer="10328" from-port="2" to-layer="10329" to-port="1" /> + <edge from-layer="10329" from-port="2" to-layer="10340" to-port="0" /> + <edge from-layer="10329" from-port="2" to-layer="10352" to-port="0" /> + <edge from-layer="10330" from-port="0" to-layer="10331" to-port="0" /> + <edge from-layer="10331" from-port="1" to-layer="10334" to-port="0" /> + <edge from-layer="10332" from-port="0" to-layer="10333" to-port="0" /> + <edge from-layer="10333" from-port="1" to-layer="10334" to-port="1" /> + <edge from-layer="10334" from-port="2" to-layer="10336" to-port="0" /> + <edge from-layer="10335" from-port="0" to-layer="10336" to-port="1" /> + <edge from-layer="10336" from-port="2" to-layer="10338" to-port="0" /> + <edge from-layer="10337" from-port="0" to-layer="10338" to-port="1" /> + <edge from-layer="10338" from-port="2" to-layer="10339" to-port="0" /> + <edge from-layer="10339" from-port="1" to-layer="10340" to-port="1" /> + <edge from-layer="10340" from-port="2" to-layer="10341" to-port="0" /> + <edge from-layer="10341" from-port="1" to-layer="10353" to-port="0" /> + <edge from-layer="10342" from-port="0" to-layer="10343" to-port="0" /> + <edge from-layer="10343" from-port="1" to-layer="10346" to-port="0" /> + <edge from-layer="10344" from-port="0" to-layer="10345" to-port="0" /> + <edge from-layer="10345" from-port="1" to-layer="10346" to-port="1" /> + <edge from-layer="10346" from-port="2" to-layer="10348" to-port="0" /> + <edge from-layer="10347" from-port="0" to-layer="10348" to-port="1" /> + <edge from-layer="10348" from-port="2" to-layer="10350" to-port="0" /> + <edge from-layer="10349" from-port="0" to-layer="10350" to-port="1" /> + <edge from-layer="10350" from-port="2" to-layer="10351" to-port="0" /> + <edge from-layer="10351" from-port="1" to-layer="10352" to-port="1" /> + <edge from-layer="10352" from-port="2" to-layer="10353" to-port="1" /> + <edge from-layer="10353" from-port="2" to-layer="10364" to-port="0" /> + <edge from-layer="10354" from-port="0" to-layer="10355" to-port="0" /> + <edge from-layer="10355" from-port="1" to-layer="10358" to-port="0" /> + <edge from-layer="10356" from-port="0" to-layer="10357" to-port="0" /> + <edge from-layer="10357" from-port="1" to-layer="10358" to-port="1" /> + <edge from-layer="10358" from-port="2" to-layer="10360" to-port="0" /> + <edge from-layer="10359" from-port="0" to-layer="10360" to-port="1" /> + <edge from-layer="10360" from-port="2" to-layer="10362" to-port="0" /> + <edge from-layer="10361" from-port="0" to-layer="10362" to-port="1" /> + <edge from-layer="10362" from-port="2" to-layer="10363" to-port="0" /> + <edge from-layer="10363" from-port="1" to-layer="10364" to-port="1" /> + <edge from-layer="10364" from-port="2" to-layer="10365" to-port="1" /> + <edge from-layer="10365" from-port="2" to-layer="10376" to-port="0" /> + <edge from-layer="10365" from-port="2" to-layer="10549" to-port="0" /> + <edge from-layer="10365" from-port="2" to-layer="10369" to-port="0" /> + <edge from-layer="10366" from-port="0" to-layer="10377" to-port="0" /> + <edge from-layer="10367" from-port="0" to-layer="10375" to-port="0" /> + <edge from-layer="10368" from-port="0" to-layer="10369" to-port="1" /> + <edge from-layer="10369" from-port="2" to-layer="10371" to-port="0" /> + <edge from-layer="10370" from-port="0" to-layer="10371" to-port="1" /> + <edge from-layer="10371" from-port="2" to-layer="10373" to-port="0" /> + <edge from-layer="10372" from-port="0" to-layer="10373" to-port="1" /> + <edge from-layer="10373" from-port="2" to-layer="10374" to-port="0" /> + <edge from-layer="10374" from-port="1" to-layer="10375" to-port="1" /> + <edge from-layer="10375" from-port="2" to-layer="10376" to-port="1" /> + <edge from-layer="10376" from-port="2" to-layer="10377" to-port="1" /> + <edge from-layer="10377" from-port="2" to-layer="10388" to-port="0" /> + <edge from-layer="10377" from-port="2" to-layer="10436" to-port="0" /> + <edge from-layer="10377" from-port="2" to-layer="10498" to-port="0" /> + <edge from-layer="10378" from-port="0" to-layer="10379" to-port="0" /> + <edge from-layer="10379" from-port="1" to-layer="10382" to-port="0" /> + <edge from-layer="10380" from-port="0" to-layer="10381" to-port="0" /> + <edge from-layer="10381" from-port="1" to-layer="10382" to-port="1" /> + <edge from-layer="10382" from-port="2" to-layer="10384" to-port="0" /> + <edge from-layer="10383" from-port="0" to-layer="10384" to-port="1" /> + <edge from-layer="10384" from-port="2" to-layer="10386" to-port="0" /> + <edge from-layer="10385" from-port="0" to-layer="10386" to-port="1" /> + <edge from-layer="10386" from-port="2" to-layer="10387" to-port="0" /> + <edge from-layer="10387" from-port="1" to-layer="10388" to-port="1" /> + <edge from-layer="10388" from-port="2" to-layer="10391" to-port="0" /> + <edge from-layer="10389" from-port="0" to-layer="10390" to-port="0" /> + <edge from-layer="10390" from-port="1" to-layer="10391" to-port="1" /> + <edge from-layer="10391" from-port="2" to-layer="10393" to-port="0" /> + <edge from-layer="10392" from-port="0" to-layer="10393" to-port="1" /> + <edge from-layer="10393" from-port="2" to-layer="10395" to-port="0" /> + <edge from-layer="10394" from-port="0" to-layer="10395" to-port="1" /> + <edge from-layer="10395" from-port="2" to-layer="10413" to-port="0" /> + <edge from-layer="10395" from-port="2" to-layer="10397" to-port="0" /> + <edge from-layer="10395" from-port="2" to-layer="10407" to-port="0" /> + <edge from-layer="10395" from-port="2" to-layer="10396" to-port="0" /> + <edge from-layer="10396" from-port="2" to-layer="10416" to-port="0" /> + <edge from-layer="10397" from-port="1" to-layer="10399" to-port="0" /> + <edge from-layer="10398" from-port="0" to-layer="10399" to-port="2" /> + <edge from-layer="10399" from-port="3" to-layer="10400" to-port="0" /> + <edge from-layer="10400" from-port="2" to-layer="10401" to-port="0" /> + <edge from-layer="10401" from-port="1" to-layer="10403" to-port="0" /> + <edge from-layer="10402" from-port="0" to-layer="10403" to-port="1" /> + <edge from-layer="10403" from-port="2" to-layer="10413" to-port="2" /> + <edge from-layer="10403" from-port="2" to-layer="10407" to-port="1" /> + <edge from-layer="10404" from-port="0" to-layer="10407" to-port="2" /> + <edge from-layer="10405" from-port="0" to-layer="10407" to-port="3" /> + <edge from-layer="10406" from-port="0" to-layer="10407" to-port="4" /> + <edge from-layer="10407" from-port="5" to-layer="10409" to-port="0" /> + <edge from-layer="10408" from-port="0" to-layer="10409" to-port="1" /> + <edge from-layer="10409" from-port="2" to-layer="10414" to-port="0" /> + <edge from-layer="10410" from-port="0" to-layer="10413" to-port="1" /> + <edge from-layer="10411" from-port="0" to-layer="10413" to-port="3" /> + <edge from-layer="10412" from-port="0" to-layer="10413" to-port="4" /> + <edge from-layer="10413" from-port="5" to-layer="10414" to-port="1" /> + <edge from-layer="10414" from-port="2" to-layer="10415" to-port="0" /> + <edge from-layer="10415" from-port="2" to-layer="10416" to-port="1" /> + <edge from-layer="10416" from-port="2" to-layer="10533" to-port="0" /> + <edge from-layer="10417" from-port="0" to-layer="10422" to-port="0" /> + <edge from-layer="10418" from-port="0" to-layer="10421" to-port="1" /> + <edge from-layer="10419" from-port="0" to-layer="10421" to-port="2" /> + <edge from-layer="10420" from-port="0" to-layer="10421" to-port="3" /> + <edge from-layer="10421" from-port="4" to-layer="10422" to-port="1" /> + <edge from-layer="10422" from-port="2" to-layer="10423" to-port="0" /> + <edge from-layer="10423" from-port="1" to-layer="10425" to-port="0" /> + <edge from-layer="10424" from-port="0" to-layer="10425" to-port="2" /> + <edge from-layer="10425" from-port="3" to-layer="10465" to-port="0" /> + <edge from-layer="10425" from-port="3" to-layer="10521" to-port="0" /> + <edge from-layer="10426" from-port="0" to-layer="10427" to-port="0" /> + <edge from-layer="10427" from-port="1" to-layer="10430" to-port="0" /> + <edge from-layer="10428" from-port="0" to-layer="10429" to-port="0" /> + <edge from-layer="10429" from-port="1" to-layer="10430" to-port="1" /> + <edge from-layer="10430" from-port="2" to-layer="10432" to-port="0" /> + <edge from-layer="10431" from-port="0" to-layer="10432" to-port="1" /> + <edge from-layer="10432" from-port="2" to-layer="10434" to-port="0" /> + <edge from-layer="10433" from-port="0" to-layer="10434" to-port="1" /> + <edge from-layer="10434" from-port="2" to-layer="10435" to-port="0" /> + <edge from-layer="10435" from-port="1" to-layer="10436" to-port="1" /> + <edge from-layer="10436" from-port="2" to-layer="10439" to-port="0" /> + <edge from-layer="10437" from-port="0" to-layer="10438" to-port="0" /> + <edge from-layer="10438" from-port="1" to-layer="10439" to-port="1" /> + <edge from-layer="10439" from-port="2" to-layer="10441" to-port="0" /> + <edge from-layer="10440" from-port="0" to-layer="10441" to-port="1" /> + <edge from-layer="10441" from-port="2" to-layer="10443" to-port="0" /> + <edge from-layer="10442" from-port="0" to-layer="10443" to-port="1" /> + <edge from-layer="10443" from-port="2" to-layer="10444" to-port="0" /> + <edge from-layer="10443" from-port="2" to-layer="10461" to-port="0" /> + <edge from-layer="10443" from-port="2" to-layer="10455" to-port="0" /> + <edge from-layer="10443" from-port="2" to-layer="10445" to-port="0" /> + <edge from-layer="10444" from-port="2" to-layer="10464" to-port="0" /> + <edge from-layer="10445" from-port="1" to-layer="10447" to-port="0" /> + <edge from-layer="10446" from-port="0" to-layer="10447" to-port="2" /> + <edge from-layer="10447" from-port="3" to-layer="10448" to-port="0" /> + <edge from-layer="10448" from-port="2" to-layer="10449" to-port="0" /> + <edge from-layer="10449" from-port="1" to-layer="10451" to-port="0" /> + <edge from-layer="10450" from-port="0" to-layer="10451" to-port="1" /> + <edge from-layer="10451" from-port="2" to-layer="10455" to-port="1" /> + <edge from-layer="10451" from-port="2" to-layer="10461" to-port="2" /> + <edge from-layer="10452" from-port="0" to-layer="10455" to-port="2" /> + <edge from-layer="10453" from-port="0" to-layer="10455" to-port="3" /> + <edge from-layer="10454" from-port="0" to-layer="10455" to-port="4" /> + <edge from-layer="10455" from-port="5" to-layer="10457" to-port="0" /> + <edge from-layer="10456" from-port="0" to-layer="10457" to-port="1" /> + <edge from-layer="10457" from-port="2" to-layer="10462" to-port="0" /> + <edge from-layer="10458" from-port="0" to-layer="10461" to-port="1" /> + <edge from-layer="10459" from-port="0" to-layer="10461" to-port="3" /> + <edge from-layer="10460" from-port="0" to-layer="10461" to-port="4" /> + <edge from-layer="10461" from-port="5" to-layer="10462" to-port="1" /> + <edge from-layer="10462" from-port="2" to-layer="10463" to-port="0" /> + <edge from-layer="10463" from-port="2" to-layer="10464" to-port="1" /> + <edge from-layer="10464" from-port="2" to-layer="10525" to-port="0" /> + <edge from-layer="10464" from-port="2" to-layer="10465" to-port="1" /> + <edge from-layer="10465" from-port="2" to-layer="11148" to-port="0" /> + <edge from-layer="10465" from-port="2" to-layer="10466" to-port="0" /> + <edge from-layer="10465" from-port="2" to-layer="10467" to-port="0" /> + <edge from-layer="10466" from-port="2" to-layer="10476" to-port="0" /> + <edge from-layer="10467" from-port="1" to-layer="10470" to-port="0" /> + <edge from-layer="10467" from-port="1" to-layer="10474" to-port="0" /> + <edge from-layer="10468" from-port="0" to-layer="10470" to-port="1" /> + <edge from-layer="10469" from-port="0" to-layer="10470" to-port="2" /> + <edge from-layer="10470" from-port="3" to-layer="10475" to-port="0" /> + <edge from-layer="10471" from-port="0" to-layer="10475" to-port="1" /> + <edge from-layer="10472" from-port="0" to-layer="10474" to-port="1" /> + <edge from-layer="10473" from-port="0" to-layer="10474" to-port="2" /> + <edge from-layer="10474" from-port="3" to-layer="10475" to-port="2" /> + <edge from-layer="10475" from-port="3" to-layer="10476" to-port="1" /> + <edge from-layer="10476" from-port="2" to-layer="10478" to-port="0" /> + <edge from-layer="10477" from-port="0" to-layer="10478" to-port="1" /> + <edge from-layer="10478" from-port="2" to-layer="10533" to-port="1" /> + <edge from-layer="10479" from-port="0" to-layer="10484" to-port="0" /> + <edge from-layer="10480" from-port="0" to-layer="10483" to-port="1" /> + <edge from-layer="10481" from-port="0" to-layer="10483" to-port="2" /> + <edge from-layer="10482" from-port="0" to-layer="10483" to-port="3" /> + <edge from-layer="10483" from-port="4" to-layer="10484" to-port="1" /> + <edge from-layer="10484" from-port="2" to-layer="10485" to-port="0" /> + <edge from-layer="10485" from-port="1" to-layer="10487" to-port="0" /> + <edge from-layer="10486" from-port="0" to-layer="10487" to-port="2" /> + <edge from-layer="10487" from-port="3" to-layer="10506" to-port="0" /> + <edge from-layer="10488" from-port="0" to-layer="10489" to-port="0" /> + <edge from-layer="10489" from-port="1" to-layer="10492" to-port="0" /> + <edge from-layer="10490" from-port="0" to-layer="10491" to-port="0" /> + <edge from-layer="10491" from-port="1" to-layer="10492" to-port="1" /> + <edge from-layer="10492" from-port="2" to-layer="10494" to-port="0" /> + <edge from-layer="10493" from-port="0" to-layer="10494" to-port="1" /> + <edge from-layer="10494" from-port="2" to-layer="10496" to-port="0" /> + <edge from-layer="10495" from-port="0" to-layer="10496" to-port="1" /> + <edge from-layer="10496" from-port="2" to-layer="10497" to-port="0" /> + <edge from-layer="10497" from-port="1" to-layer="10498" to-port="1" /> + <edge from-layer="10498" from-port="2" to-layer="10501" to-port="0" /> + <edge from-layer="10499" from-port="0" to-layer="10500" to-port="0" /> + <edge from-layer="10500" from-port="1" to-layer="10501" to-port="1" /> + <edge from-layer="10501" from-port="2" to-layer="10503" to-port="0" /> + <edge from-layer="10502" from-port="0" to-layer="10503" to-port="1" /> + <edge from-layer="10503" from-port="2" to-layer="10505" to-port="0" /> + <edge from-layer="10504" from-port="0" to-layer="10505" to-port="1" /> + <edge from-layer="10505" from-port="2" to-layer="10506" to-port="1" /> + <edge from-layer="10506" from-port="2" to-layer="10507" to-port="0" /> + <edge from-layer="10506" from-port="2" to-layer="10508" to-port="0" /> + <edge from-layer="10506" from-port="2" to-layer="11147" to-port="0" /> + <edge from-layer="10507" from-port="2" to-layer="10517" to-port="0" /> + <edge from-layer="10508" from-port="1" to-layer="10511" to-port="0" /> + <edge from-layer="10508" from-port="1" to-layer="10515" to-port="0" /> + <edge from-layer="10509" from-port="0" to-layer="10511" to-port="1" /> + <edge from-layer="10510" from-port="0" to-layer="10511" to-port="2" /> + <edge from-layer="10511" from-port="3" to-layer="10516" to-port="1" /> + <edge from-layer="10512" from-port="0" to-layer="10516" to-port="2" /> + <edge from-layer="10513" from-port="0" to-layer="10515" to-port="1" /> + <edge from-layer="10514" from-port="0" to-layer="10515" to-port="2" /> + <edge from-layer="10515" from-port="3" to-layer="10516" to-port="3" /> + <edge from-layer="10516" from-port="4" to-layer="10517" to-port="1" /> + <edge from-layer="10517" from-port="2" to-layer="10519" to-port="0" /> + <edge from-layer="10518" from-port="0" to-layer="10519" to-port="1" /> + <edge from-layer="10519" from-port="2" to-layer="10533" to-port="2" /> + <edge from-layer="10520" from-port="0" to-layer="10532" to-port="1" /> + <edge from-layer="10521" from-port="1" to-layer="10524" to-port="0" /> + <edge from-layer="10522" from-port="0" to-layer="10524" to-port="1" /> + <edge from-layer="10523" from-port="0" to-layer="10524" to-port="2" /> + <edge from-layer="10524" from-port="3" to-layer="10529" to-port="0" /> + <edge from-layer="10525" from-port="1" to-layer="10528" to-port="0" /> + <edge from-layer="10526" from-port="0" to-layer="10528" to-port="1" /> + <edge from-layer="10527" from-port="0" to-layer="10528" to-port="2" /> + <edge from-layer="10528" from-port="3" to-layer="10529" to-port="1" /> + <edge from-layer="10529" from-port="2" to-layer="10532" to-port="2" /> + <edge from-layer="10530" from-port="0" to-layer="10532" to-port="3" /> + <edge from-layer="10531" from-port="0" to-layer="10532" to-port="4" /> + <edge from-layer="10532" from-port="5" to-layer="10533" to-port="3" /> + <edge from-layer="10533" from-port="4" to-layer="10535" to-port="0" /> + <edge from-layer="10534" from-port="0" to-layer="10535" to-port="1" /> + <edge from-layer="10535" from-port="2" to-layer="10537" to-port="0" /> + <edge from-layer="10536" from-port="0" to-layer="10537" to-port="1" /> + <edge from-layer="10537" from-port="2" to-layer="10548" to-port="0" /> + <edge from-layer="10538" from-port="0" to-layer="10539" to-port="0" /> + <edge from-layer="10539" from-port="1" to-layer="10542" to-port="0" /> + <edge from-layer="10540" from-port="0" to-layer="10541" to-port="0" /> + <edge from-layer="10541" from-port="1" to-layer="10542" to-port="1" /> + <edge from-layer="10542" from-port="2" to-layer="10544" to-port="0" /> + <edge from-layer="10543" from-port="0" to-layer="10544" to-port="1" /> + <edge from-layer="10544" from-port="2" to-layer="10546" to-port="0" /> + <edge from-layer="10545" from-port="0" to-layer="10546" to-port="1" /> + <edge from-layer="10546" from-port="2" to-layer="10547" to-port="0" /> + <edge from-layer="10547" from-port="1" to-layer="10548" to-port="1" /> + <edge from-layer="10548" from-port="2" to-layer="10549" to-port="1" /> + <edge from-layer="10549" from-port="2" to-layer="10553" to-port="0" /> + <edge from-layer="10549" from-port="2" to-layer="10560" to-port="0" /> + <edge from-layer="10549" from-port="2" to-layer="10597" to-port="0" /> + <edge from-layer="10550" from-port="0" to-layer="10561" to-port="0" /> + <edge from-layer="10551" from-port="0" to-layer="10559" to-port="0" /> + <edge from-layer="10552" from-port="0" to-layer="10553" to-port="1" /> + <edge from-layer="10553" from-port="2" to-layer="10555" to-port="0" /> + <edge from-layer="10554" from-port="0" to-layer="10555" to-port="1" /> + <edge from-layer="10555" from-port="2" to-layer="10557" to-port="0" /> + <edge from-layer="10556" from-port="0" to-layer="10557" to-port="1" /> + <edge from-layer="10557" from-port="2" to-layer="10558" to-port="0" /> + <edge from-layer="10558" from-port="1" to-layer="10559" to-port="1" /> + <edge from-layer="10559" from-port="2" to-layer="10560" to-port="1" /> + <edge from-layer="10560" from-port="2" to-layer="10561" to-port="1" /> + <edge from-layer="10561" from-port="2" to-layer="10572" to-port="0" /> + <edge from-layer="10561" from-port="2" to-layer="10584" to-port="0" /> + <edge from-layer="10562" from-port="0" to-layer="10563" to-port="0" /> + <edge from-layer="10563" from-port="1" to-layer="10566" to-port="0" /> + <edge from-layer="10564" from-port="0" to-layer="10565" to-port="0" /> + <edge from-layer="10565" from-port="1" to-layer="10566" to-port="1" /> + <edge from-layer="10566" from-port="2" to-layer="10568" to-port="0" /> + <edge from-layer="10567" from-port="0" to-layer="10568" to-port="1" /> + <edge from-layer="10568" from-port="2" to-layer="10570" to-port="0" /> + <edge from-layer="10569" from-port="0" to-layer="10570" to-port="1" /> + <edge from-layer="10570" from-port="2" to-layer="10571" to-port="0" /> + <edge from-layer="10571" from-port="1" to-layer="10572" to-port="1" /> + <edge from-layer="10572" from-port="2" to-layer="10573" to-port="0" /> + <edge from-layer="10573" from-port="1" to-layer="10585" to-port="0" /> + <edge from-layer="10574" from-port="0" to-layer="10575" to-port="0" /> + <edge from-layer="10575" from-port="1" to-layer="10578" to-port="0" /> + <edge from-layer="10576" from-port="0" to-layer="10577" to-port="0" /> + <edge from-layer="10577" from-port="1" to-layer="10578" to-port="1" /> + <edge from-layer="10578" from-port="2" to-layer="10580" to-port="0" /> + <edge from-layer="10579" from-port="0" to-layer="10580" to-port="1" /> + <edge from-layer="10580" from-port="2" to-layer="10582" to-port="0" /> + <edge from-layer="10581" from-port="0" to-layer="10582" to-port="1" /> + <edge from-layer="10582" from-port="2" to-layer="10583" to-port="0" /> + <edge from-layer="10583" from-port="1" to-layer="10584" to-port="1" /> + <edge from-layer="10584" from-port="2" to-layer="10585" to-port="1" /> + <edge from-layer="10585" from-port="2" to-layer="10596" to-port="0" /> + <edge from-layer="10586" from-port="0" to-layer="10587" to-port="0" /> + <edge from-layer="10587" from-port="1" to-layer="10590" to-port="0" /> + <edge from-layer="10588" from-port="0" to-layer="10589" to-port="0" /> + <edge from-layer="10589" from-port="1" to-layer="10590" to-port="1" /> + <edge from-layer="10590" from-port="2" to-layer="10592" to-port="0" /> + <edge from-layer="10591" from-port="0" to-layer="10592" to-port="1" /> + <edge from-layer="10592" from-port="2" to-layer="10594" to-port="0" /> + <edge from-layer="10593" from-port="0" to-layer="10594" to-port="1" /> + <edge from-layer="10594" from-port="2" to-layer="10595" to-port="0" /> + <edge from-layer="10595" from-port="1" to-layer="10596" to-port="1" /> + <edge from-layer="10596" from-port="2" to-layer="10597" to-port="1" /> + <edge from-layer="10597" from-port="2" to-layer="10781" to-port="0" /> + <edge from-layer="10597" from-port="2" to-layer="10601" to-port="0" /> + <edge from-layer="10597" from-port="2" to-layer="10608" to-port="0" /> + <edge from-layer="10598" from-port="0" to-layer="10609" to-port="0" /> + <edge from-layer="10599" from-port="0" to-layer="10607" to-port="0" /> + <edge from-layer="10600" from-port="0" to-layer="10601" to-port="1" /> + <edge from-layer="10601" from-port="2" to-layer="10603" to-port="0" /> + <edge from-layer="10602" from-port="0" to-layer="10603" to-port="1" /> + <edge from-layer="10603" from-port="2" to-layer="10605" to-port="0" /> + <edge from-layer="10604" from-port="0" to-layer="10605" to-port="1" /> + <edge from-layer="10605" from-port="2" to-layer="10606" to-port="0" /> + <edge from-layer="10606" from-port="1" to-layer="10607" to-port="1" /> + <edge from-layer="10607" from-port="2" to-layer="10608" to-port="1" /> + <edge from-layer="10608" from-port="2" to-layer="10609" to-port="1" /> + <edge from-layer="10609" from-port="2" to-layer="10668" to-port="0" /> + <edge from-layer="10609" from-port="2" to-layer="10730" to-port="0" /> + <edge from-layer="10609" from-port="2" to-layer="10620" to-port="0" /> + <edge from-layer="10610" from-port="0" to-layer="10611" to-port="0" /> + <edge from-layer="10611" from-port="1" to-layer="10614" to-port="0" /> + <edge from-layer="10612" from-port="0" to-layer="10613" to-port="0" /> + <edge from-layer="10613" from-port="1" to-layer="10614" to-port="1" /> + <edge from-layer="10614" from-port="2" to-layer="10616" to-port="0" /> + <edge from-layer="10615" from-port="0" to-layer="10616" to-port="1" /> + <edge from-layer="10616" from-port="2" to-layer="10618" to-port="0" /> + <edge from-layer="10617" from-port="0" to-layer="10618" to-port="1" /> + <edge from-layer="10618" from-port="2" to-layer="10619" to-port="0" /> + <edge from-layer="10619" from-port="1" to-layer="10620" to-port="1" /> + <edge from-layer="10620" from-port="2" to-layer="10623" to-port="0" /> + <edge from-layer="10621" from-port="0" to-layer="10622" to-port="0" /> + <edge from-layer="10622" from-port="1" to-layer="10623" to-port="1" /> + <edge from-layer="10623" from-port="2" to-layer="10625" to-port="0" /> + <edge from-layer="10624" from-port="0" to-layer="10625" to-port="1" /> + <edge from-layer="10625" from-port="2" to-layer="10627" to-port="0" /> + <edge from-layer="10626" from-port="0" to-layer="10627" to-port="1" /> + <edge from-layer="10627" from-port="2" to-layer="10639" to-port="0" /> + <edge from-layer="10627" from-port="2" to-layer="10628" to-port="0" /> + <edge from-layer="10627" from-port="2" to-layer="10629" to-port="0" /> + <edge from-layer="10627" from-port="2" to-layer="10645" to-port="0" /> + <edge from-layer="10628" from-port="2" to-layer="10648" to-port="0" /> + <edge from-layer="10629" from-port="1" to-layer="10631" to-port="0" /> + <edge from-layer="10630" from-port="0" to-layer="10631" to-port="2" /> + <edge from-layer="10631" from-port="3" to-layer="10632" to-port="0" /> + <edge from-layer="10632" from-port="2" to-layer="10633" to-port="0" /> + <edge from-layer="10633" from-port="1" to-layer="10635" to-port="0" /> + <edge from-layer="10634" from-port="0" to-layer="10635" to-port="1" /> + <edge from-layer="10635" from-port="2" to-layer="10639" to-port="1" /> + <edge from-layer="10635" from-port="2" to-layer="10645" to-port="2" /> + <edge from-layer="10636" from-port="0" to-layer="10639" to-port="2" /> + <edge from-layer="10637" from-port="0" to-layer="10639" to-port="3" /> + <edge from-layer="10638" from-port="0" to-layer="10639" to-port="4" /> + <edge from-layer="10639" from-port="5" to-layer="10641" to-port="0" /> + <edge from-layer="10640" from-port="0" to-layer="10641" to-port="1" /> + <edge from-layer="10641" from-port="2" to-layer="10646" to-port="0" /> + <edge from-layer="10642" from-port="0" to-layer="10645" to-port="1" /> + <edge from-layer="10643" from-port="0" to-layer="10645" to-port="3" /> + <edge from-layer="10644" from-port="0" to-layer="10645" to-port="4" /> + <edge from-layer="10645" from-port="5" to-layer="10646" to-port="1" /> + <edge from-layer="10646" from-port="2" to-layer="10647" to-port="0" /> + <edge from-layer="10647" from-port="2" to-layer="10648" to-port="1" /> + <edge from-layer="10648" from-port="2" to-layer="10765" to-port="0" /> + <edge from-layer="10649" from-port="0" to-layer="10654" to-port="0" /> + <edge from-layer="10650" from-port="0" to-layer="10653" to-port="1" /> + <edge from-layer="10651" from-port="0" to-layer="10653" to-port="2" /> + <edge from-layer="10652" from-port="0" to-layer="10653" to-port="3" /> + <edge from-layer="10653" from-port="4" to-layer="10654" to-port="1" /> + <edge from-layer="10654" from-port="2" to-layer="10655" to-port="0" /> + <edge from-layer="10655" from-port="1" to-layer="10657" to-port="0" /> + <edge from-layer="10656" from-port="0" to-layer="10657" to-port="2" /> + <edge from-layer="10657" from-port="3" to-layer="10697" to-port="0" /> + <edge from-layer="10657" from-port="3" to-layer="10753" to-port="0" /> + <edge from-layer="10658" from-port="0" to-layer="10659" to-port="0" /> + <edge from-layer="10659" from-port="1" to-layer="10662" to-port="0" /> + <edge from-layer="10660" from-port="0" to-layer="10661" to-port="0" /> + <edge from-layer="10661" from-port="1" to-layer="10662" to-port="1" /> + <edge from-layer="10662" from-port="2" to-layer="10664" to-port="0" /> + <edge from-layer="10663" from-port="0" to-layer="10664" to-port="1" /> + <edge from-layer="10664" from-port="2" to-layer="10666" to-port="0" /> + <edge from-layer="10665" from-port="0" to-layer="10666" to-port="1" /> + <edge from-layer="10666" from-port="2" to-layer="10667" to-port="0" /> + <edge from-layer="10667" from-port="1" to-layer="10668" to-port="1" /> + <edge from-layer="10668" from-port="2" to-layer="10671" to-port="0" /> + <edge from-layer="10669" from-port="0" to-layer="10670" to-port="0" /> + <edge from-layer="10670" from-port="1" to-layer="10671" to-port="1" /> + <edge from-layer="10671" from-port="2" to-layer="10673" to-port="0" /> + <edge from-layer="10672" from-port="0" to-layer="10673" to-port="1" /> + <edge from-layer="10673" from-port="2" to-layer="10675" to-port="0" /> + <edge from-layer="10674" from-port="0" to-layer="10675" to-port="1" /> + <edge from-layer="10675" from-port="2" to-layer="10693" to-port="0" /> + <edge from-layer="10675" from-port="2" to-layer="10676" to-port="0" /> + <edge from-layer="10675" from-port="2" to-layer="10677" to-port="0" /> + <edge from-layer="10675" from-port="2" to-layer="10687" to-port="0" /> + <edge from-layer="10676" from-port="2" to-layer="10696" to-port="0" /> + <edge from-layer="10677" from-port="1" to-layer="10679" to-port="0" /> + <edge from-layer="10678" from-port="0" to-layer="10679" to-port="2" /> + <edge from-layer="10679" from-port="3" to-layer="10680" to-port="0" /> + <edge from-layer="10680" from-port="2" to-layer="10681" to-port="0" /> + <edge from-layer="10681" from-port="1" to-layer="10683" to-port="0" /> + <edge from-layer="10682" from-port="0" to-layer="10683" to-port="1" /> + <edge from-layer="10683" from-port="2" to-layer="10693" to-port="2" /> + <edge from-layer="10683" from-port="2" to-layer="10687" to-port="1" /> + <edge from-layer="10684" from-port="0" to-layer="10687" to-port="2" /> + <edge from-layer="10685" from-port="0" to-layer="10687" to-port="3" /> + <edge from-layer="10686" from-port="0" to-layer="10687" to-port="4" /> + <edge from-layer="10687" from-port="5" to-layer="10689" to-port="0" /> + <edge from-layer="10688" from-port="0" to-layer="10689" to-port="1" /> + <edge from-layer="10689" from-port="2" to-layer="10694" to-port="0" /> + <edge from-layer="10690" from-port="0" to-layer="10693" to-port="1" /> + <edge from-layer="10691" from-port="0" to-layer="10693" to-port="3" /> + <edge from-layer="10692" from-port="0" to-layer="10693" to-port="4" /> + <edge from-layer="10693" from-port="5" to-layer="10694" to-port="1" /> + <edge from-layer="10694" from-port="2" to-layer="10695" to-port="0" /> + <edge from-layer="10695" from-port="2" to-layer="10696" to-port="1" /> + <edge from-layer="10696" from-port="2" to-layer="10697" to-port="1" /> + <edge from-layer="10696" from-port="2" to-layer="10757" to-port="0" /> + <edge from-layer="10697" from-port="2" to-layer="11146" to-port="0" /> + <edge from-layer="10697" from-port="2" to-layer="10698" to-port="0" /> + <edge from-layer="10697" from-port="2" to-layer="10699" to-port="0" /> + <edge from-layer="10698" from-port="2" to-layer="10708" to-port="0" /> + <edge from-layer="10699" from-port="1" to-layer="10706" to-port="0" /> + <edge from-layer="10699" from-port="1" to-layer="10702" to-port="0" /> + <edge from-layer="10700" from-port="0" to-layer="10702" to-port="1" /> + <edge from-layer="10701" from-port="0" to-layer="10702" to-port="2" /> + <edge from-layer="10702" from-port="3" to-layer="10707" to-port="0" /> + <edge from-layer="10703" from-port="0" to-layer="10707" to-port="1" /> + <edge from-layer="10704" from-port="0" to-layer="10706" to-port="1" /> + <edge from-layer="10705" from-port="0" to-layer="10706" to-port="2" /> + <edge from-layer="10706" from-port="3" to-layer="10707" to-port="2" /> + <edge from-layer="10707" from-port="3" to-layer="10708" to-port="1" /> + <edge from-layer="10708" from-port="2" to-layer="10710" to-port="0" /> + <edge from-layer="10709" from-port="0" to-layer="10710" to-port="1" /> + <edge from-layer="10710" from-port="2" to-layer="10765" to-port="1" /> + <edge from-layer="10711" from-port="0" to-layer="10716" to-port="0" /> + <edge from-layer="10712" from-port="0" to-layer="10715" to-port="1" /> + <edge from-layer="10713" from-port="0" to-layer="10715" to-port="2" /> + <edge from-layer="10714" from-port="0" to-layer="10715" to-port="3" /> + <edge from-layer="10715" from-port="4" to-layer="10716" to-port="1" /> + <edge from-layer="10716" from-port="2" to-layer="10717" to-port="0" /> + <edge from-layer="10717" from-port="1" to-layer="10719" to-port="0" /> + <edge from-layer="10718" from-port="0" to-layer="10719" to-port="2" /> + <edge from-layer="10719" from-port="3" to-layer="10738" to-port="0" /> + <edge from-layer="10720" from-port="0" to-layer="10721" to-port="0" /> + <edge from-layer="10721" from-port="1" to-layer="10724" to-port="0" /> + <edge from-layer="10722" from-port="0" to-layer="10723" to-port="0" /> + <edge from-layer="10723" from-port="1" to-layer="10724" to-port="1" /> + <edge from-layer="10724" from-port="2" to-layer="10726" to-port="0" /> + <edge from-layer="10725" from-port="0" to-layer="10726" to-port="1" /> + <edge from-layer="10726" from-port="2" to-layer="10728" to-port="0" /> + <edge from-layer="10727" from-port="0" to-layer="10728" to-port="1" /> + <edge from-layer="10728" from-port="2" to-layer="10729" to-port="0" /> + <edge from-layer="10729" from-port="1" to-layer="10730" to-port="1" /> + <edge from-layer="10730" from-port="2" to-layer="10733" to-port="0" /> + <edge from-layer="10731" from-port="0" to-layer="10732" to-port="0" /> + <edge from-layer="10732" from-port="1" to-layer="10733" to-port="1" /> + <edge from-layer="10733" from-port="2" to-layer="10735" to-port="0" /> + <edge from-layer="10734" from-port="0" to-layer="10735" to-port="1" /> + <edge from-layer="10735" from-port="2" to-layer="10737" to-port="0" /> + <edge from-layer="10736" from-port="0" to-layer="10737" to-port="1" /> + <edge from-layer="10737" from-port="2" to-layer="10738" to-port="1" /> + <edge from-layer="10738" from-port="2" to-layer="10739" to-port="0" /> + <edge from-layer="10738" from-port="2" to-layer="10740" to-port="0" /> + <edge from-layer="10738" from-port="2" to-layer="11145" to-port="0" /> + <edge from-layer="10739" from-port="2" to-layer="10749" to-port="0" /> + <edge from-layer="10740" from-port="1" to-layer="10743" to-port="0" /> + <edge from-layer="10740" from-port="1" to-layer="10747" to-port="0" /> + <edge from-layer="10741" from-port="0" to-layer="10743" to-port="1" /> + <edge from-layer="10742" from-port="0" to-layer="10743" to-port="2" /> + <edge from-layer="10743" from-port="3" to-layer="10748" to-port="1" /> + <edge from-layer="10744" from-port="0" to-layer="10748" to-port="2" /> + <edge from-layer="10745" from-port="0" to-layer="10747" to-port="1" /> + <edge from-layer="10746" from-port="0" to-layer="10747" to-port="2" /> + <edge from-layer="10747" from-port="3" to-layer="10748" to-port="3" /> + <edge from-layer="10748" from-port="4" to-layer="10749" to-port="1" /> + <edge from-layer="10749" from-port="2" to-layer="10751" to-port="0" /> + <edge from-layer="10750" from-port="0" to-layer="10751" to-port="1" /> + <edge from-layer="10751" from-port="2" to-layer="10765" to-port="2" /> + <edge from-layer="10752" from-port="0" to-layer="10764" to-port="1" /> + <edge from-layer="10753" from-port="1" to-layer="10756" to-port="0" /> + <edge from-layer="10754" from-port="0" to-layer="10756" to-port="1" /> + <edge from-layer="10755" from-port="0" to-layer="10756" to-port="2" /> + <edge from-layer="10756" from-port="3" to-layer="10761" to-port="0" /> + <edge from-layer="10757" from-port="1" to-layer="10760" to-port="0" /> + <edge from-layer="10758" from-port="0" to-layer="10760" to-port="1" /> + <edge from-layer="10759" from-port="0" to-layer="10760" to-port="2" /> + <edge from-layer="10760" from-port="3" to-layer="10761" to-port="1" /> + <edge from-layer="10761" from-port="2" to-layer="10764" to-port="2" /> + <edge from-layer="10762" from-port="0" to-layer="10764" to-port="3" /> + <edge from-layer="10763" from-port="0" to-layer="10764" to-port="4" /> + <edge from-layer="10764" from-port="5" to-layer="10765" to-port="3" /> + <edge from-layer="10765" from-port="4" to-layer="10767" to-port="0" /> + <edge from-layer="10766" from-port="0" to-layer="10767" to-port="1" /> + <edge from-layer="10767" from-port="2" to-layer="10769" to-port="0" /> + <edge from-layer="10768" from-port="0" to-layer="10769" to-port="1" /> + <edge from-layer="10769" from-port="2" to-layer="10780" to-port="0" /> + <edge from-layer="10770" from-port="0" to-layer="10771" to-port="0" /> + <edge from-layer="10771" from-port="1" to-layer="10774" to-port="0" /> + <edge from-layer="10772" from-port="0" to-layer="10773" to-port="0" /> + <edge from-layer="10773" from-port="1" to-layer="10774" to-port="1" /> + <edge from-layer="10774" from-port="2" to-layer="10776" to-port="0" /> + <edge from-layer="10775" from-port="0" to-layer="10776" to-port="1" /> + <edge from-layer="10776" from-port="2" to-layer="10778" to-port="0" /> + <edge from-layer="10777" from-port="0" to-layer="10778" to-port="1" /> + <edge from-layer="10778" from-port="2" to-layer="10779" to-port="0" /> + <edge from-layer="10779" from-port="1" to-layer="10780" to-port="1" /> + <edge from-layer="10780" from-port="2" to-layer="10781" to-port="1" /> + <edge from-layer="10781" from-port="2" to-layer="10829" to-port="0" /> + <edge from-layer="10781" from-port="2" to-layer="10785" to-port="0" /> + <edge from-layer="10781" from-port="2" to-layer="10792" to-port="0" /> + <edge from-layer="10782" from-port="0" to-layer="10793" to-port="0" /> + <edge from-layer="10783" from-port="0" to-layer="10791" to-port="0" /> + <edge from-layer="10784" from-port="0" to-layer="10785" to-port="1" /> + <edge from-layer="10785" from-port="2" to-layer="10787" to-port="0" /> + <edge from-layer="10786" from-port="0" to-layer="10787" to-port="1" /> + <edge from-layer="10787" from-port="2" to-layer="10789" to-port="0" /> + <edge from-layer="10788" from-port="0" to-layer="10789" to-port="1" /> + <edge from-layer="10789" from-port="2" to-layer="10790" to-port="0" /> + <edge from-layer="10790" from-port="1" to-layer="10791" to-port="1" /> + <edge from-layer="10791" from-port="2" to-layer="10792" to-port="1" /> + <edge from-layer="10792" from-port="2" to-layer="10793" to-port="1" /> + <edge from-layer="10793" from-port="2" to-layer="10816" to-port="0" /> + <edge from-layer="10793" from-port="2" to-layer="10804" to-port="0" /> + <edge from-layer="10794" from-port="0" to-layer="10795" to-port="0" /> + <edge from-layer="10795" from-port="1" to-layer="10798" to-port="0" /> + <edge from-layer="10796" from-port="0" to-layer="10797" to-port="0" /> + <edge from-layer="10797" from-port="1" to-layer="10798" to-port="1" /> + <edge from-layer="10798" from-port="2" to-layer="10800" to-port="0" /> + <edge from-layer="10799" from-port="0" to-layer="10800" to-port="1" /> + <edge from-layer="10800" from-port="2" to-layer="10802" to-port="0" /> + <edge from-layer="10801" from-port="0" to-layer="10802" to-port="1" /> + <edge from-layer="10802" from-port="2" to-layer="10803" to-port="0" /> + <edge from-layer="10803" from-port="1" to-layer="10804" to-port="1" /> + <edge from-layer="10804" from-port="2" to-layer="10805" to-port="0" /> + <edge from-layer="10805" from-port="1" to-layer="10817" to-port="0" /> + <edge from-layer="10806" from-port="0" to-layer="10807" to-port="0" /> + <edge from-layer="10807" from-port="1" to-layer="10810" to-port="0" /> + <edge from-layer="10808" from-port="0" to-layer="10809" to-port="0" /> + <edge from-layer="10809" from-port="1" to-layer="10810" to-port="1" /> + <edge from-layer="10810" from-port="2" to-layer="10812" to-port="0" /> + <edge from-layer="10811" from-port="0" to-layer="10812" to-port="1" /> + <edge from-layer="10812" from-port="2" to-layer="10814" to-port="0" /> + <edge from-layer="10813" from-port="0" to-layer="10814" to-port="1" /> + <edge from-layer="10814" from-port="2" to-layer="10815" to-port="0" /> + <edge from-layer="10815" from-port="1" to-layer="10816" to-port="1" /> + <edge from-layer="10816" from-port="2" to-layer="10817" to-port="1" /> + <edge from-layer="10817" from-port="2" to-layer="10828" to-port="0" /> + <edge from-layer="10818" from-port="0" to-layer="10819" to-port="0" /> + <edge from-layer="10819" from-port="1" to-layer="10822" to-port="0" /> + <edge from-layer="10820" from-port="0" to-layer="10821" to-port="0" /> + <edge from-layer="10821" from-port="1" to-layer="10822" to-port="1" /> + <edge from-layer="10822" from-port="2" to-layer="10824" to-port="0" /> + <edge from-layer="10823" from-port="0" to-layer="10824" to-port="1" /> + <edge from-layer="10824" from-port="2" to-layer="10826" to-port="0" /> + <edge from-layer="10825" from-port="0" to-layer="10826" to-port="1" /> + <edge from-layer="10826" from-port="2" to-layer="10827" to-port="0" /> + <edge from-layer="10827" from-port="1" to-layer="10828" to-port="1" /> + <edge from-layer="10828" from-port="2" to-layer="10829" to-port="1" /> + <edge from-layer="10829" from-port="2" to-layer="11013" to-port="0" /> + <edge from-layer="10829" from-port="2" to-layer="10833" to-port="0" /> + <edge from-layer="10829" from-port="2" to-layer="10840" to-port="0" /> + <edge from-layer="10830" from-port="0" to-layer="10841" to-port="0" /> + <edge from-layer="10831" from-port="0" to-layer="10839" to-port="0" /> + <edge from-layer="10832" from-port="0" to-layer="10833" to-port="1" /> + <edge from-layer="10833" from-port="2" to-layer="10835" to-port="0" /> + <edge from-layer="10834" from-port="0" to-layer="10835" to-port="1" /> + <edge from-layer="10835" from-port="2" to-layer="10837" to-port="0" /> + <edge from-layer="10836" from-port="0" to-layer="10837" to-port="1" /> + <edge from-layer="10837" from-port="2" to-layer="10838" to-port="0" /> + <edge from-layer="10838" from-port="1" to-layer="10839" to-port="1" /> + <edge from-layer="10839" from-port="2" to-layer="10840" to-port="1" /> + <edge from-layer="10840" from-port="2" to-layer="10841" to-port="1" /> + <edge from-layer="10841" from-port="2" to-layer="10900" to-port="0" /> + <edge from-layer="10841" from-port="2" to-layer="10962" to-port="0" /> + <edge from-layer="10841" from-port="2" to-layer="10852" to-port="0" /> + <edge from-layer="10842" from-port="0" to-layer="10843" to-port="0" /> + <edge from-layer="10843" from-port="1" to-layer="10846" to-port="0" /> + <edge from-layer="10844" from-port="0" to-layer="10845" to-port="0" /> + <edge from-layer="10845" from-port="1" to-layer="10846" to-port="1" /> + <edge from-layer="10846" from-port="2" to-layer="10848" to-port="0" /> + <edge from-layer="10847" from-port="0" to-layer="10848" to-port="1" /> + <edge from-layer="10848" from-port="2" to-layer="10850" to-port="0" /> + <edge from-layer="10849" from-port="0" to-layer="10850" to-port="1" /> + <edge from-layer="10850" from-port="2" to-layer="10851" to-port="0" /> + <edge from-layer="10851" from-port="1" to-layer="10852" to-port="1" /> + <edge from-layer="10852" from-port="2" to-layer="10855" to-port="0" /> + <edge from-layer="10853" from-port="0" to-layer="10854" to-port="0" /> + <edge from-layer="10854" from-port="1" to-layer="10855" to-port="1" /> + <edge from-layer="10855" from-port="2" to-layer="10857" to-port="0" /> + <edge from-layer="10856" from-port="0" to-layer="10857" to-port="1" /> + <edge from-layer="10857" from-port="2" to-layer="10859" to-port="0" /> + <edge from-layer="10858" from-port="0" to-layer="10859" to-port="1" /> + <edge from-layer="10859" from-port="2" to-layer="10877" to-port="0" /> + <edge from-layer="10859" from-port="2" to-layer="10871" to-port="0" /> + <edge from-layer="10859" from-port="2" to-layer="10861" to-port="0" /> + <edge from-layer="10859" from-port="2" to-layer="10860" to-port="0" /> + <edge from-layer="10860" from-port="2" to-layer="10880" to-port="0" /> + <edge from-layer="10861" from-port="1" to-layer="10863" to-port="0" /> + <edge from-layer="10862" from-port="0" to-layer="10863" to-port="2" /> + <edge from-layer="10863" from-port="3" to-layer="10864" to-port="0" /> + <edge from-layer="10864" from-port="2" to-layer="10865" to-port="0" /> + <edge from-layer="10865" from-port="1" to-layer="10867" to-port="0" /> + <edge from-layer="10866" from-port="0" to-layer="10867" to-port="1" /> + <edge from-layer="10867" from-port="2" to-layer="10871" to-port="1" /> + <edge from-layer="10867" from-port="2" to-layer="10877" to-port="2" /> + <edge from-layer="10868" from-port="0" to-layer="10871" to-port="2" /> + <edge from-layer="10869" from-port="0" to-layer="10871" to-port="3" /> + <edge from-layer="10870" from-port="0" to-layer="10871" to-port="4" /> + <edge from-layer="10871" from-port="5" to-layer="10873" to-port="0" /> + <edge from-layer="10872" from-port="0" to-layer="10873" to-port="1" /> + <edge from-layer="10873" from-port="2" to-layer="10878" to-port="0" /> + <edge from-layer="10874" from-port="0" to-layer="10877" to-port="1" /> + <edge from-layer="10875" from-port="0" to-layer="10877" to-port="3" /> + <edge from-layer="10876" from-port="0" to-layer="10877" to-port="4" /> + <edge from-layer="10877" from-port="5" to-layer="10878" to-port="1" /> + <edge from-layer="10878" from-port="2" to-layer="10879" to-port="0" /> + <edge from-layer="10879" from-port="2" to-layer="10880" to-port="1" /> + <edge from-layer="10880" from-port="2" to-layer="10997" to-port="0" /> + <edge from-layer="10881" from-port="0" to-layer="10886" to-port="0" /> + <edge from-layer="10882" from-port="0" to-layer="10885" to-port="1" /> + <edge from-layer="10883" from-port="0" to-layer="10885" to-port="2" /> + <edge from-layer="10884" from-port="0" to-layer="10885" to-port="3" /> + <edge from-layer="10885" from-port="4" to-layer="10886" to-port="1" /> + <edge from-layer="10886" from-port="2" to-layer="10887" to-port="0" /> + <edge from-layer="10887" from-port="1" to-layer="10889" to-port="0" /> + <edge from-layer="10888" from-port="0" to-layer="10889" to-port="2" /> + <edge from-layer="10889" from-port="3" to-layer="10929" to-port="0" /> + <edge from-layer="10889" from-port="3" to-layer="10985" to-port="0" /> + <edge from-layer="10890" from-port="0" to-layer="10891" to-port="0" /> + <edge from-layer="10891" from-port="1" to-layer="10894" to-port="0" /> + <edge from-layer="10892" from-port="0" to-layer="10893" to-port="0" /> + <edge from-layer="10893" from-port="1" to-layer="10894" to-port="1" /> + <edge from-layer="10894" from-port="2" to-layer="10896" to-port="0" /> + <edge from-layer="10895" from-port="0" to-layer="10896" to-port="1" /> + <edge from-layer="10896" from-port="2" to-layer="10898" to-port="0" /> + <edge from-layer="10897" from-port="0" to-layer="10898" to-port="1" /> + <edge from-layer="10898" from-port="2" to-layer="10899" to-port="0" /> + <edge from-layer="10899" from-port="1" to-layer="10900" to-port="1" /> + <edge from-layer="10900" from-port="2" to-layer="10903" to-port="0" /> + <edge from-layer="10901" from-port="0" to-layer="10902" to-port="0" /> + <edge from-layer="10902" from-port="1" to-layer="10903" to-port="1" /> + <edge from-layer="10903" from-port="2" to-layer="10905" to-port="0" /> + <edge from-layer="10904" from-port="0" to-layer="10905" to-port="1" /> + <edge from-layer="10905" from-port="2" to-layer="10907" to-port="0" /> + <edge from-layer="10906" from-port="0" to-layer="10907" to-port="1" /> + <edge from-layer="10907" from-port="2" to-layer="10925" to-port="0" /> + <edge from-layer="10907" from-port="2" to-layer="10919" to-port="0" /> + <edge from-layer="10907" from-port="2" to-layer="10908" to-port="0" /> + <edge from-layer="10907" from-port="2" to-layer="10909" to-port="0" /> + <edge from-layer="10908" from-port="2" to-layer="10928" to-port="0" /> + <edge from-layer="10909" from-port="1" to-layer="10911" to-port="0" /> + <edge from-layer="10910" from-port="0" to-layer="10911" to-port="2" /> + <edge from-layer="10911" from-port="3" to-layer="10912" to-port="0" /> + <edge from-layer="10912" from-port="2" to-layer="10913" to-port="0" /> + <edge from-layer="10913" from-port="1" to-layer="10915" to-port="0" /> + <edge from-layer="10914" from-port="0" to-layer="10915" to-port="1" /> + <edge from-layer="10915" from-port="2" to-layer="10919" to-port="1" /> + <edge from-layer="10915" from-port="2" to-layer="10925" to-port="2" /> + <edge from-layer="10916" from-port="0" to-layer="10919" to-port="2" /> + <edge from-layer="10917" from-port="0" to-layer="10919" to-port="3" /> + <edge from-layer="10918" from-port="0" to-layer="10919" to-port="4" /> + <edge from-layer="10919" from-port="5" to-layer="10921" to-port="0" /> + <edge from-layer="10920" from-port="0" to-layer="10921" to-port="1" /> + <edge from-layer="10921" from-port="2" to-layer="10926" to-port="0" /> + <edge from-layer="10922" from-port="0" to-layer="10925" to-port="1" /> + <edge from-layer="10923" from-port="0" to-layer="10925" to-port="3" /> + <edge from-layer="10924" from-port="0" to-layer="10925" to-port="4" /> + <edge from-layer="10925" from-port="5" to-layer="10926" to-port="1" /> + <edge from-layer="10926" from-port="2" to-layer="10927" to-port="0" /> + <edge from-layer="10927" from-port="2" to-layer="10928" to-port="1" /> + <edge from-layer="10928" from-port="2" to-layer="10929" to-port="1" /> + <edge from-layer="10928" from-port="2" to-layer="10989" to-port="0" /> + <edge from-layer="10929" from-port="2" to-layer="10930" to-port="0" /> + <edge from-layer="10929" from-port="2" to-layer="10931" to-port="0" /> + <edge from-layer="10929" from-port="2" to-layer="11144" to-port="0" /> + <edge from-layer="10930" from-port="2" to-layer="10940" to-port="0" /> + <edge from-layer="10931" from-port="1" to-layer="10938" to-port="0" /> + <edge from-layer="10931" from-port="1" to-layer="10934" to-port="0" /> + <edge from-layer="10932" from-port="0" to-layer="10934" to-port="1" /> + <edge from-layer="10933" from-port="0" to-layer="10934" to-port="2" /> + <edge from-layer="10934" from-port="3" to-layer="10939" to-port="0" /> + <edge from-layer="10935" from-port="0" to-layer="10939" to-port="1" /> + <edge from-layer="10936" from-port="0" to-layer="10938" to-port="1" /> + <edge from-layer="10937" from-port="0" to-layer="10938" to-port="2" /> + <edge from-layer="10938" from-port="3" to-layer="10939" to-port="2" /> + <edge from-layer="10939" from-port="3" to-layer="10940" to-port="1" /> + <edge from-layer="10940" from-port="2" to-layer="10942" to-port="0" /> + <edge from-layer="10941" from-port="0" to-layer="10942" to-port="1" /> + <edge from-layer="10942" from-port="2" to-layer="10997" to-port="1" /> + <edge from-layer="10943" from-port="0" to-layer="10948" to-port="0" /> + <edge from-layer="10944" from-port="0" to-layer="10947" to-port="1" /> + <edge from-layer="10945" from-port="0" to-layer="10947" to-port="2" /> + <edge from-layer="10946" from-port="0" to-layer="10947" to-port="3" /> + <edge from-layer="10947" from-port="4" to-layer="10948" to-port="1" /> + <edge from-layer="10948" from-port="2" to-layer="10949" to-port="0" /> + <edge from-layer="10949" from-port="1" to-layer="10951" to-port="0" /> + <edge from-layer="10950" from-port="0" to-layer="10951" to-port="2" /> + <edge from-layer="10951" from-port="3" to-layer="10970" to-port="0" /> + <edge from-layer="10952" from-port="0" to-layer="10953" to-port="0" /> + <edge from-layer="10953" from-port="1" to-layer="10956" to-port="0" /> + <edge from-layer="10954" from-port="0" to-layer="10955" to-port="0" /> + <edge from-layer="10955" from-port="1" to-layer="10956" to-port="1" /> + <edge from-layer="10956" from-port="2" to-layer="10958" to-port="0" /> + <edge from-layer="10957" from-port="0" to-layer="10958" to-port="1" /> + <edge from-layer="10958" from-port="2" to-layer="10960" to-port="0" /> + <edge from-layer="10959" from-port="0" to-layer="10960" to-port="1" /> + <edge from-layer="10960" from-port="2" to-layer="10961" to-port="0" /> + <edge from-layer="10961" from-port="1" to-layer="10962" to-port="1" /> + <edge from-layer="10962" from-port="2" to-layer="10965" to-port="0" /> + <edge from-layer="10963" from-port="0" to-layer="10964" to-port="0" /> + <edge from-layer="10964" from-port="1" to-layer="10965" to-port="1" /> + <edge from-layer="10965" from-port="2" to-layer="10967" to-port="0" /> + <edge from-layer="10966" from-port="0" to-layer="10967" to-port="1" /> + <edge from-layer="10967" from-port="2" to-layer="10969" to-port="0" /> + <edge from-layer="10968" from-port="0" to-layer="10969" to-port="1" /> + <edge from-layer="10969" from-port="2" to-layer="10970" to-port="1" /> + <edge from-layer="10970" from-port="2" to-layer="11143" to-port="0" /> + <edge from-layer="10970" from-port="2" to-layer="10972" to-port="0" /> + <edge from-layer="10970" from-port="2" to-layer="10971" to-port="0" /> + <edge from-layer="10971" from-port="2" to-layer="10981" to-port="0" /> + <edge from-layer="10972" from-port="1" to-layer="10975" to-port="0" /> + <edge from-layer="10972" from-port="1" to-layer="10979" to-port="0" /> + <edge from-layer="10973" from-port="0" to-layer="10975" to-port="1" /> + <edge from-layer="10974" from-port="0" to-layer="10975" to-port="2" /> + <edge from-layer="10975" from-port="3" to-layer="10980" to-port="1" /> + <edge from-layer="10976" from-port="0" to-layer="10980" to-port="2" /> + <edge from-layer="10977" from-port="0" to-layer="10979" to-port="1" /> + <edge from-layer="10978" from-port="0" to-layer="10979" to-port="2" /> + <edge from-layer="10979" from-port="3" to-layer="10980" to-port="3" /> + <edge from-layer="10980" from-port="4" to-layer="10981" to-port="1" /> + <edge from-layer="10981" from-port="2" to-layer="10983" to-port="0" /> + <edge from-layer="10982" from-port="0" to-layer="10983" to-port="1" /> + <edge from-layer="10983" from-port="2" to-layer="10997" to-port="2" /> + <edge from-layer="10984" from-port="0" to-layer="10996" to-port="1" /> + <edge from-layer="10985" from-port="1" to-layer="10988" to-port="0" /> + <edge from-layer="10986" from-port="0" to-layer="10988" to-port="1" /> + <edge from-layer="10987" from-port="0" to-layer="10988" to-port="2" /> + <edge from-layer="10988" from-port="3" to-layer="10993" to-port="0" /> + <edge from-layer="10989" from-port="1" to-layer="10992" to-port="0" /> + <edge from-layer="10990" from-port="0" to-layer="10992" to-port="1" /> + <edge from-layer="10991" from-port="0" to-layer="10992" to-port="2" /> + <edge from-layer="10992" from-port="3" to-layer="10993" to-port="1" /> + <edge from-layer="10993" from-port="2" to-layer="10996" to-port="2" /> + <edge from-layer="10994" from-port="0" to-layer="10996" to-port="3" /> + <edge from-layer="10995" from-port="0" to-layer="10996" to-port="4" /> + <edge from-layer="10996" from-port="5" to-layer="10997" to-port="3" /> + <edge from-layer="10997" from-port="4" to-layer="10999" to-port="0" /> + <edge from-layer="10998" from-port="0" to-layer="10999" to-port="1" /> + <edge from-layer="10999" from-port="2" to-layer="11001" to-port="0" /> + <edge from-layer="11000" from-port="0" to-layer="11001" to-port="1" /> + <edge from-layer="11001" from-port="2" to-layer="11012" to-port="0" /> + <edge from-layer="11002" from-port="0" to-layer="11003" to-port="0" /> + <edge from-layer="11003" from-port="1" to-layer="11006" to-port="0" /> + <edge from-layer="11004" from-port="0" to-layer="11005" to-port="0" /> + <edge from-layer="11005" from-port="1" to-layer="11006" to-port="1" /> + <edge from-layer="11006" from-port="2" to-layer="11008" to-port="0" /> + <edge from-layer="11007" from-port="0" to-layer="11008" to-port="1" /> + <edge from-layer="11008" from-port="2" to-layer="11010" to-port="0" /> + <edge from-layer="11009" from-port="0" to-layer="11010" to-port="1" /> + <edge from-layer="11010" from-port="2" to-layer="11011" to-port="0" /> + <edge from-layer="11011" from-port="1" to-layer="11012" to-port="1" /> + <edge from-layer="11012" from-port="2" to-layer="11013" to-port="1" /> + <edge from-layer="11013" from-port="2" to-layer="11024" to-port="0" /> + <edge from-layer="11013" from-port="2" to-layer="11017" to-port="0" /> + <edge from-layer="11013" from-port="2" to-layer="11061" to-port="0" /> + <edge from-layer="11014" from-port="0" to-layer="11025" to-port="0" /> + <edge from-layer="11015" from-port="0" to-layer="11023" to-port="0" /> + <edge from-layer="11016" from-port="0" to-layer="11017" to-port="1" /> + <edge from-layer="11017" from-port="2" to-layer="11019" to-port="0" /> + <edge from-layer="11018" from-port="0" to-layer="11019" to-port="1" /> + <edge from-layer="11019" from-port="2" to-layer="11021" to-port="0" /> + <edge from-layer="11020" from-port="0" to-layer="11021" to-port="1" /> + <edge from-layer="11021" from-port="2" to-layer="11022" to-port="0" /> + <edge from-layer="11022" from-port="1" to-layer="11023" to-port="1" /> + <edge from-layer="11023" from-port="2" to-layer="11024" to-port="1" /> + <edge from-layer="11024" from-port="2" to-layer="11025" to-port="1" /> + <edge from-layer="11025" from-port="2" to-layer="11036" to-port="0" /> + <edge from-layer="11025" from-port="2" to-layer="11048" to-port="0" /> + <edge from-layer="11026" from-port="0" to-layer="11027" to-port="0" /> + <edge from-layer="11027" from-port="1" to-layer="11030" to-port="0" /> + <edge from-layer="11028" from-port="0" to-layer="11029" to-port="0" /> + <edge from-layer="11029" from-port="1" to-layer="11030" to-port="1" /> + <edge from-layer="11030" from-port="2" to-layer="11032" to-port="0" /> + <edge from-layer="11031" from-port="0" to-layer="11032" to-port="1" /> + <edge from-layer="11032" from-port="2" to-layer="11034" to-port="0" /> + <edge from-layer="11033" from-port="0" to-layer="11034" to-port="1" /> + <edge from-layer="11034" from-port="2" to-layer="11035" to-port="0" /> + <edge from-layer="11035" from-port="1" to-layer="11036" to-port="1" /> + <edge from-layer="11036" from-port="2" to-layer="11037" to-port="0" /> + <edge from-layer="11037" from-port="1" to-layer="11049" to-port="0" /> + <edge from-layer="11038" from-port="0" to-layer="11039" to-port="0" /> + <edge from-layer="11039" from-port="1" to-layer="11042" to-port="0" /> + <edge from-layer="11040" from-port="0" to-layer="11041" to-port="0" /> + <edge from-layer="11041" from-port="1" to-layer="11042" to-port="1" /> + <edge from-layer="11042" from-port="2" to-layer="11044" to-port="0" /> + <edge from-layer="11043" from-port="0" to-layer="11044" to-port="1" /> + <edge from-layer="11044" from-port="2" to-layer="11046" to-port="0" /> + <edge from-layer="11045" from-port="0" to-layer="11046" to-port="1" /> + <edge from-layer="11046" from-port="2" to-layer="11047" to-port="0" /> + <edge from-layer="11047" from-port="1" to-layer="11048" to-port="1" /> + <edge from-layer="11048" from-port="2" to-layer="11049" to-port="1" /> + <edge from-layer="11049" from-port="2" to-layer="11060" to-port="0" /> + <edge from-layer="11050" from-port="0" to-layer="11051" to-port="0" /> + <edge from-layer="11051" from-port="1" to-layer="11054" to-port="0" /> + <edge from-layer="11052" from-port="0" to-layer="11053" to-port="0" /> + <edge from-layer="11053" from-port="1" to-layer="11054" to-port="1" /> + <edge from-layer="11054" from-port="2" to-layer="11056" to-port="0" /> + <edge from-layer="11055" from-port="0" to-layer="11056" to-port="1" /> + <edge from-layer="11056" from-port="2" to-layer="11058" to-port="0" /> + <edge from-layer="11057" from-port="0" to-layer="11058" to-port="1" /> + <edge from-layer="11058" from-port="2" to-layer="11059" to-port="0" /> + <edge from-layer="11059" from-port="1" to-layer="11060" to-port="1" /> + <edge from-layer="11060" from-port="2" to-layer="11061" to-port="1" /> + <edge from-layer="11061" from-port="2" to-layer="11071" to-port="0" /> + <edge from-layer="11061" from-port="2" to-layer="11322" to-port="0" /> + <edge from-layer="11061" from-port="2" to-layer="11064" to-port="0" /> + <edge from-layer="11062" from-port="0" to-layer="11070" to-port="0" /> + <edge from-layer="11063" from-port="0" to-layer="11064" to-port="1" /> + <edge from-layer="11064" from-port="2" to-layer="11066" to-port="0" /> + <edge from-layer="11065" from-port="0" to-layer="11066" to-port="1" /> + <edge from-layer="11066" from-port="2" to-layer="11068" to-port="0" /> + <edge from-layer="11067" from-port="0" to-layer="11068" to-port="1" /> + <edge from-layer="11068" from-port="2" to-layer="11069" to-port="0" /> + <edge from-layer="11069" from-port="1" to-layer="11070" to-port="1" /> + <edge from-layer="11070" from-port="2" to-layer="11071" to-port="1" /> + <edge from-layer="11071" from-port="2" to-layer="11072" to-port="1" /> + <edge from-layer="11072" from-port="2" to-layer="11112" to-port="0" /> + <edge from-layer="11072" from-port="2" to-layer="11238" to-port="0" /> + <edge from-layer="11072" from-port="2" to-layer="11083" to-port="0" /> + <edge from-layer="11073" from-port="0" to-layer="11074" to-port="0" /> + <edge from-layer="11074" from-port="1" to-layer="11077" to-port="0" /> + <edge from-layer="11075" from-port="0" to-layer="11076" to-port="0" /> + <edge from-layer="11076" from-port="1" to-layer="11077" to-port="1" /> + <edge from-layer="11077" from-port="2" to-layer="11079" to-port="0" /> + <edge from-layer="11078" from-port="0" to-layer="11079" to-port="1" /> + <edge from-layer="11079" from-port="2" to-layer="11081" to-port="0" /> + <edge from-layer="11080" from-port="0" to-layer="11081" to-port="1" /> + <edge from-layer="11081" from-port="2" to-layer="11082" to-port="0" /> + <edge from-layer="11082" from-port="1" to-layer="11083" to-port="1" /> + <edge from-layer="11083" from-port="2" to-layer="11086" to-port="0" /> + <edge from-layer="11084" from-port="0" to-layer="11085" to-port="0" /> + <edge from-layer="11085" from-port="1" to-layer="11086" to-port="1" /> + <edge from-layer="11086" from-port="2" to-layer="11088" to-port="0" /> + <edge from-layer="11087" from-port="0" to-layer="11088" to-port="1" /> + <edge from-layer="11088" from-port="2" to-layer="11090" to-port="0" /> + <edge from-layer="11089" from-port="0" to-layer="11090" to-port="1" /> + <edge from-layer="11090" from-port="2" to-layer="11091" to-port="1" /> + <edge from-layer="11091" from-port="2" to-layer="11280" to-port="0" /> + <edge from-layer="11091" from-port="2" to-layer="11281" to-port="0" /> + <edge from-layer="11091" from-port="2" to-layer="11092" to-port="0" /> + <edge from-layer="11093" from-port="0" to-layer="11098" to-port="0" /> + <edge from-layer="11094" from-port="0" to-layer="11097" to-port="1" /> + <edge from-layer="11095" from-port="0" to-layer="11097" to-port="2" /> + <edge from-layer="11096" from-port="0" to-layer="11097" to-port="3" /> + <edge from-layer="11097" from-port="4" to-layer="11098" to-port="1" /> + <edge from-layer="11098" from-port="2" to-layer="11099" to-port="0" /> + <edge from-layer="11099" from-port="1" to-layer="11101" to-port="0" /> + <edge from-layer="11100" from-port="0" to-layer="11101" to-port="2" /> + <edge from-layer="11101" from-port="3" to-layer="11294" to-port="0" /> + <edge from-layer="11101" from-port="3" to-layer="11141" to-port="0" /> + <edge from-layer="11102" from-port="0" to-layer="11103" to-port="0" /> + <edge from-layer="11103" from-port="1" to-layer="11106" to-port="0" /> + <edge from-layer="11104" from-port="0" to-layer="11105" to-port="0" /> + <edge from-layer="11105" from-port="1" to-layer="11106" to-port="1" /> + <edge from-layer="11106" from-port="2" to-layer="11108" to-port="0" /> + <edge from-layer="11107" from-port="0" to-layer="11108" to-port="1" /> + <edge from-layer="11108" from-port="2" to-layer="11110" to-port="0" /> + <edge from-layer="11109" from-port="0" to-layer="11110" to-port="1" /> + <edge from-layer="11110" from-port="2" to-layer="11111" to-port="0" /> + <edge from-layer="11111" from-port="1" to-layer="11112" to-port="1" /> + <edge from-layer="11112" from-port="2" to-layer="11115" to-port="0" /> + <edge from-layer="11113" from-port="0" to-layer="11114" to-port="0" /> + <edge from-layer="11114" from-port="1" to-layer="11115" to-port="1" /> + <edge from-layer="11115" from-port="2" to-layer="11117" to-port="0" /> + <edge from-layer="11116" from-port="0" to-layer="11117" to-port="1" /> + <edge from-layer="11117" from-port="2" to-layer="11119" to-port="0" /> + <edge from-layer="11118" from-port="0" to-layer="11119" to-port="1" /> + <edge from-layer="11119" from-port="2" to-layer="11137" to-port="0" /> + <edge from-layer="11119" from-port="2" to-layer="11121" to-port="0" /> + <edge from-layer="11119" from-port="2" to-layer="11131" to-port="0" /> + <edge from-layer="11119" from-port="2" to-layer="11120" to-port="0" /> + <edge from-layer="11120" from-port="2" to-layer="11140" to-port="0" /> + <edge from-layer="11121" from-port="1" to-layer="11123" to-port="0" /> + <edge from-layer="11122" from-port="0" to-layer="11123" to-port="2" /> + <edge from-layer="11123" from-port="3" to-layer="11124" to-port="0" /> + <edge from-layer="11124" from-port="2" to-layer="11125" to-port="0" /> + <edge from-layer="11125" from-port="1" to-layer="11127" to-port="0" /> + <edge from-layer="11126" from-port="0" to-layer="11127" to-port="1" /> + <edge from-layer="11127" from-port="2" to-layer="11131" to-port="1" /> + <edge from-layer="11127" from-port="2" to-layer="11137" to-port="2" /> + <edge from-layer="11128" from-port="0" to-layer="11131" to-port="2" /> + <edge from-layer="11129" from-port="0" to-layer="11131" to-port="3" /> + <edge from-layer="11130" from-port="0" to-layer="11131" to-port="4" /> + <edge from-layer="11131" from-port="5" to-layer="11133" to-port="0" /> + <edge from-layer="11132" from-port="0" to-layer="11133" to-port="1" /> + <edge from-layer="11133" from-port="2" to-layer="11138" to-port="0" /> + <edge from-layer="11134" from-port="0" to-layer="11137" to-port="1" /> + <edge from-layer="11135" from-port="0" to-layer="11137" to-port="3" /> + <edge from-layer="11136" from-port="0" to-layer="11137" to-port="4" /> + <edge from-layer="11137" from-port="5" to-layer="11138" to-port="1" /> + <edge from-layer="11138" from-port="2" to-layer="11139" to-port="0" /> + <edge from-layer="11139" from-port="2" to-layer="11140" to-port="1" /> + <edge from-layer="11140" from-port="2" to-layer="11298" to-port="0" /> + <edge from-layer="11140" from-port="2" to-layer="11141" to-port="1" /> + <edge from-layer="11141" from-port="2" to-layer="11267" to-port="0" /> + <edge from-layer="11141" from-port="2" to-layer="11142" to-port="0" /> + <edge from-layer="11141" from-port="2" to-layer="11268" to-port="0" /> + <edge from-layer="11227" from-port="0" to-layer="11381" to-port="0" /> + <edge from-layer="11228" from-port="0" to-layer="11229" to-port="0" /> + <edge from-layer="11229" from-port="1" to-layer="11232" to-port="0" /> + <edge from-layer="11230" from-port="0" to-layer="11231" to-port="0" /> + <edge from-layer="11231" from-port="1" to-layer="11232" to-port="1" /> + <edge from-layer="11232" from-port="2" to-layer="11234" to-port="0" /> + <edge from-layer="11233" from-port="0" to-layer="11234" to-port="1" /> + <edge from-layer="11234" from-port="2" to-layer="11236" to-port="0" /> + <edge from-layer="11235" from-port="0" to-layer="11236" to-port="1" /> + <edge from-layer="11236" from-port="2" to-layer="11237" to-port="0" /> + <edge from-layer="11237" from-port="1" to-layer="11238" to-port="1" /> + <edge from-layer="11238" from-port="2" to-layer="11241" to-port="0" /> + <edge from-layer="11239" from-port="0" to-layer="11240" to-port="0" /> + <edge from-layer="11240" from-port="1" to-layer="11241" to-port="1" /> + <edge from-layer="11241" from-port="2" to-layer="11243" to-port="0" /> + <edge from-layer="11242" from-port="0" to-layer="11243" to-port="1" /> + <edge from-layer="11243" from-port="2" to-layer="11245" to-port="0" /> + <edge from-layer="11244" from-port="0" to-layer="11245" to-port="1" /> + <edge from-layer="11245" from-port="2" to-layer="11257" to-port="0" /> + <edge from-layer="11245" from-port="2" to-layer="11263" to-port="0" /> + <edge from-layer="11245" from-port="2" to-layer="11246" to-port="0" /> + <edge from-layer="11245" from-port="2" to-layer="11247" to-port="0" /> + <edge from-layer="11246" from-port="2" to-layer="11266" to-port="0" /> + <edge from-layer="11247" from-port="1" to-layer="11249" to-port="0" /> + <edge from-layer="11248" from-port="0" to-layer="11249" to-port="2" /> + <edge from-layer="11249" from-port="3" to-layer="11250" to-port="0" /> + <edge from-layer="11250" from-port="2" to-layer="11251" to-port="0" /> + <edge from-layer="11251" from-port="1" to-layer="11253" to-port="0" /> + <edge from-layer="11252" from-port="0" to-layer="11253" to-port="1" /> + <edge from-layer="11253" from-port="2" to-layer="11257" to-port="1" /> + <edge from-layer="11253" from-port="2" to-layer="11263" to-port="2" /> + <edge from-layer="11254" from-port="0" to-layer="11257" to-port="2" /> + <edge from-layer="11255" from-port="0" to-layer="11257" to-port="3" /> + <edge from-layer="11256" from-port="0" to-layer="11257" to-port="4" /> + <edge from-layer="11257" from-port="5" to-layer="11259" to-port="0" /> + <edge from-layer="11258" from-port="0" to-layer="11259" to-port="1" /> + <edge from-layer="11259" from-port="2" to-layer="11264" to-port="0" /> + <edge from-layer="11260" from-port="0" to-layer="11263" to-port="1" /> + <edge from-layer="11261" from-port="0" to-layer="11263" to-port="3" /> + <edge from-layer="11262" from-port="0" to-layer="11263" to-port="4" /> + <edge from-layer="11263" from-port="5" to-layer="11264" to-port="1" /> + <edge from-layer="11264" from-port="2" to-layer="11265" to-port="0" /> + <edge from-layer="11265" from-port="2" to-layer="11266" to-port="1" /> + <edge from-layer="11266" from-port="2" to-layer="11306" to-port="0" /> + <edge from-layer="11267" from-port="2" to-layer="11277" to-port="0" /> + <edge from-layer="11268" from-port="1" to-layer="11275" to-port="0" /> + <edge from-layer="11268" from-port="1" to-layer="11271" to-port="0" /> + <edge from-layer="11269" from-port="0" to-layer="11271" to-port="1" /> + <edge from-layer="11270" from-port="0" to-layer="11271" to-port="2" /> + <edge from-layer="11271" from-port="3" to-layer="11276" to-port="0" /> + <edge from-layer="11272" from-port="0" to-layer="11276" to-port="1" /> + <edge from-layer="11273" from-port="0" to-layer="11275" to-port="1" /> + <edge from-layer="11274" from-port="0" to-layer="11275" to-port="2" /> + <edge from-layer="11275" from-port="3" to-layer="11276" to-port="2" /> + <edge from-layer="11276" from-port="3" to-layer="11277" to-port="1" /> + <edge from-layer="11277" from-port="2" to-layer="11279" to-port="0" /> + <edge from-layer="11278" from-port="0" to-layer="11279" to-port="1" /> + <edge from-layer="11279" from-port="2" to-layer="11306" to-port="1" /> + <edge from-layer="11280" from-port="2" to-layer="11290" to-port="0" /> + <edge from-layer="11281" from-port="1" to-layer="11288" to-port="0" /> + <edge from-layer="11281" from-port="1" to-layer="11284" to-port="0" /> + <edge from-layer="11282" from-port="0" to-layer="11284" to-port="1" /> + <edge from-layer="11283" from-port="0" to-layer="11284" to-port="2" /> + <edge from-layer="11284" from-port="3" to-layer="11289" to-port="1" /> + <edge from-layer="11285" from-port="0" to-layer="11289" to-port="2" /> + <edge from-layer="11286" from-port="0" to-layer="11288" to-port="1" /> + <edge from-layer="11287" from-port="0" to-layer="11288" to-port="2" /> + <edge from-layer="11288" from-port="3" to-layer="11289" to-port="3" /> + <edge from-layer="11289" from-port="4" to-layer="11290" to-port="1" /> + <edge from-layer="11290" from-port="2" to-layer="11292" to-port="0" /> + <edge from-layer="11291" from-port="0" to-layer="11292" to-port="1" /> + <edge from-layer="11292" from-port="2" to-layer="11306" to-port="2" /> + <edge from-layer="11293" from-port="0" to-layer="11305" to-port="1" /> + <edge from-layer="11294" from-port="1" to-layer="11297" to-port="0" /> + <edge from-layer="11295" from-port="0" to-layer="11297" to-port="1" /> + <edge from-layer="11296" from-port="0" to-layer="11297" to-port="2" /> + <edge from-layer="11297" from-port="3" to-layer="11302" to-port="0" /> + <edge from-layer="11298" from-port="1" to-layer="11301" to-port="0" /> + <edge from-layer="11299" from-port="0" to-layer="11301" to-port="1" /> + <edge from-layer="11300" from-port="0" to-layer="11301" to-port="2" /> + <edge from-layer="11301" from-port="3" to-layer="11302" to-port="1" /> + <edge from-layer="11302" from-port="2" to-layer="11305" to-port="2" /> + <edge from-layer="11303" from-port="0" to-layer="11305" to-port="3" /> + <edge from-layer="11304" from-port="0" to-layer="11305" to-port="4" /> + <edge from-layer="11305" from-port="5" to-layer="11306" to-port="3" /> + <edge from-layer="11306" from-port="4" to-layer="11308" to-port="0" /> + <edge from-layer="11307" from-port="0" to-layer="11308" to-port="1" /> + <edge from-layer="11308" from-port="2" to-layer="11310" to-port="0" /> + <edge from-layer="11309" from-port="0" to-layer="11310" to-port="1" /> + <edge from-layer="11310" from-port="2" to-layer="11321" to-port="0" /> + <edge from-layer="11311" from-port="0" to-layer="11312" to-port="0" /> + <edge from-layer="11312" from-port="1" to-layer="11315" to-port="0" /> + <edge from-layer="11313" from-port="0" to-layer="11314" to-port="0" /> + <edge from-layer="11314" from-port="1" to-layer="11315" to-port="1" /> + <edge from-layer="11315" from-port="2" to-layer="11317" to-port="0" /> + <edge from-layer="11316" from-port="0" to-layer="11317" to-port="1" /> + <edge from-layer="11317" from-port="2" to-layer="11319" to-port="0" /> + <edge from-layer="11318" from-port="0" to-layer="11319" to-port="1" /> + <edge from-layer="11319" from-port="2" to-layer="11320" to-port="0" /> + <edge from-layer="11320" from-port="1" to-layer="11321" to-port="1" /> + <edge from-layer="11321" from-port="2" to-layer="11322" to-port="1" /> + <edge from-layer="11322" from-port="2" to-layer="11326" to-port="0" /> + <edge from-layer="11322" from-port="2" to-layer="11370" to-port="0" /> + <edge from-layer="11322" from-port="2" to-layer="11333" to-port="0" /> + <edge from-layer="11323" from-port="0" to-layer="11334" to-port="0" /> + <edge from-layer="11324" from-port="0" to-layer="11332" to-port="0" /> + <edge from-layer="11325" from-port="0" to-layer="11326" to-port="1" /> + <edge from-layer="11326" from-port="2" to-layer="11328" to-port="0" /> + <edge from-layer="11327" from-port="0" to-layer="11328" to-port="1" /> + <edge from-layer="11328" from-port="2" to-layer="11330" to-port="0" /> + <edge from-layer="11329" from-port="0" to-layer="11330" to-port="1" /> + <edge from-layer="11330" from-port="2" to-layer="11331" to-port="0" /> + <edge from-layer="11331" from-port="1" to-layer="11332" to-port="1" /> + <edge from-layer="11332" from-port="2" to-layer="11333" to-port="1" /> + <edge from-layer="11333" from-port="2" to-layer="11334" to-port="1" /> + <edge from-layer="11334" from-port="2" to-layer="11357" to-port="0" /> + <edge from-layer="11334" from-port="2" to-layer="11345" to-port="0" /> + <edge from-layer="11335" from-port="0" to-layer="11336" to-port="0" /> + <edge from-layer="11336" from-port="1" to-layer="11339" to-port="0" /> + <edge from-layer="11337" from-port="0" to-layer="11338" to-port="0" /> + <edge from-layer="11338" from-port="1" to-layer="11339" to-port="1" /> + <edge from-layer="11339" from-port="2" to-layer="11341" to-port="0" /> + <edge from-layer="11340" from-port="0" to-layer="11341" to-port="1" /> + <edge from-layer="11341" from-port="2" to-layer="11343" to-port="0" /> + <edge from-layer="11342" from-port="0" to-layer="11343" to-port="1" /> + <edge from-layer="11343" from-port="2" to-layer="11344" to-port="0" /> + <edge from-layer="11344" from-port="1" to-layer="11345" to-port="1" /> + <edge from-layer="11345" from-port="2" to-layer="11346" to-port="0" /> + <edge from-layer="11346" from-port="1" to-layer="11358" to-port="0" /> + <edge from-layer="11347" from-port="0" to-layer="11348" to-port="0" /> + <edge from-layer="11348" from-port="1" to-layer="11351" to-port="0" /> + <edge from-layer="11349" from-port="0" to-layer="11350" to-port="0" /> + <edge from-layer="11350" from-port="1" to-layer="11351" to-port="1" /> + <edge from-layer="11351" from-port="2" to-layer="11353" to-port="0" /> + <edge from-layer="11352" from-port="0" to-layer="11353" to-port="1" /> + <edge from-layer="11353" from-port="2" to-layer="11355" to-port="0" /> + <edge from-layer="11354" from-port="0" to-layer="11355" to-port="1" /> + <edge from-layer="11355" from-port="2" to-layer="11356" to-port="0" /> + <edge from-layer="11356" from-port="1" to-layer="11357" to-port="1" /> + <edge from-layer="11357" from-port="2" to-layer="11358" to-port="1" /> + <edge from-layer="11358" from-port="2" to-layer="11369" to-port="0" /> + <edge from-layer="11359" from-port="0" to-layer="11360" to-port="0" /> + <edge from-layer="11360" from-port="1" to-layer="11363" to-port="0" /> + <edge from-layer="11361" from-port="0" to-layer="11362" to-port="0" /> + <edge from-layer="11362" from-port="1" to-layer="11363" to-port="1" /> + <edge from-layer="11363" from-port="2" to-layer="11365" to-port="0" /> + <edge from-layer="11364" from-port="0" to-layer="11365" to-port="1" /> + <edge from-layer="11365" from-port="2" to-layer="11367" to-port="0" /> + <edge from-layer="11366" from-port="0" to-layer="11367" to-port="1" /> + <edge from-layer="11367" from-port="2" to-layer="11368" to-port="0" /> + <edge from-layer="11368" from-port="1" to-layer="11369" to-port="1" /> + <edge from-layer="11369" from-port="2" to-layer="11370" to-port="1" /> + <edge from-layer="11370" from-port="2" to-layer="11373" to-port="0" /> + <edge from-layer="11370" from-port="2" to-layer="11380" to-port="0" /> + <edge from-layer="11371" from-port="0" to-layer="11379" to-port="0" /> + <edge from-layer="11372" from-port="0" to-layer="11373" to-port="1" /> + <edge from-layer="11373" from-port="2" to-layer="11375" to-port="0" /> + <edge from-layer="11374" from-port="0" to-layer="11375" to-port="1" /> + <edge from-layer="11375" from-port="2" to-layer="11377" to-port="0" /> + <edge from-layer="11376" from-port="0" to-layer="11377" to-port="1" /> + <edge from-layer="11377" from-port="2" to-layer="11378" to-port="0" /> + <edge from-layer="11378" from-port="1" to-layer="11379" to-port="1" /> + <edge from-layer="11379" from-port="2" to-layer="11380" to-port="1" /> + <edge from-layer="11380" from-port="2" to-layer="11381" to-port="1" /> + <edge from-layer="11381" from-port="2" to-layer="11390" to-port="0" /> + <edge from-layer="11382" from-port="0" to-layer="11383" to-port="0" /> + <edge from-layer="11383" from-port="1" to-layer="11386" to-port="0" /> + <edge from-layer="11384" from-port="0" to-layer="11385" to-port="0" /> + <edge from-layer="11385" from-port="1" to-layer="11386" to-port="1" /> + <edge from-layer="11386" from-port="2" to-layer="11388" to-port="0" /> + <edge from-layer="11387" from-port="0" to-layer="11388" to-port="1" /> + <edge from-layer="11388" from-port="2" to-layer="11389" to-port="0" /> + <edge from-layer="11389" from-port="1" to-layer="11390" to-port="1" /> + <edge from-layer="11390" from-port="2" to-layer="11391" to-port="0" /> + </edges> + <rt_info> + <Runtime_version value="2024.4.0-16579-c3152d32c9c-releases/2024/4" /> + <conversion_parameters> + <framework value="pytorch" /> + <is_python_object value="True" /> + </conversion_parameters> + <nncf> + <friendly_names_were_updated value="True" /> + <weight_compression> + <advanced_parameters value="{'awq_params': {'subset_size': 32, 'percent_to_apply': 0.002, 'alpha_min': 0.0, 'alpha_max': 1.0, 'steps': 100}, 'scale_estimation_params': {'subset_size': 64, 'initial_steps': 5, 'scale_steps': 5, 'weight_penalty': -1.0}, 'gptq_params': {'damp_percent': 0.1, 'block_size': 128, 'subset_size': 128}, 'lora_correction_params': {'adapter_rank': 8, 'num_iterations': 3, 'apply_regularization': True, 'subset_size': 128, 'use_int8_adapters': True}}" /> + <all_layers value="False" /> + <awq value="False" /> + <gptq value="False" /> + <group_size value="128" /> + <ignored_scope value="[]" /> + <lora_correction value="False" /> + <mode value="int4_asym" /> + <ratio value="1.0" /> + <scale_estimation value="False" /> + <sensitivity_metric value="weight_quantization_error" /> + </weight_compression> + </nncf> + <optimum> + <optimum_intel_version value="1.20.0" /> + <optimum_version value="1.23.0" /> + <pytorch_version value="2.4.1" /> + <transformers_version value="4.45.2" /> + </optimum> + </rt_info> +</net>