<?xml version="1.0"?> <net name="Model0" version="11"> <layers> <layer id="3" name="attention_mask" type="Parameter" version="opset1"> <data shape="?,?" element_type="i64" /> <output> <port id="0" precision="I64" names="attention_mask"> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="2" name="position_ids" type="Parameter" version="opset1"> <data shape="?,?" element_type="i64" /> <output> <port id="0" precision="I64" names="position_ids"> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="1" name="inputs_embeds" type="Parameter" version="opset1"> <data shape="?,?,3072" element_type="f32" /> <output> <port id="0" precision="FP32" names="inputs_embeds"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="0" name="beam_idx" type="Parameter" version="opset1"> <data shape="?" element_type="i32" /> <output> <port id="0" precision="I32" names="beam_idx"> <dim>-1</dim> </port> </output> </layer> <layer id="4" name="Constant_102194_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="5" name="Constant_102194" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="6" name="ShapeOf_102180" type="ShapeOf" version="opset3"> <data output_type="i64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="7" name="Constant_102182" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="8" name="Constant_102184" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="9" name="Gather_102185" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="I64"> <dim>3</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="10" name="Constant_102187" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="11" name="Constant_102189" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="12" name="Constant_102191" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="13" name="Concat_102192" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="14" name="Broadcast_102195" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="15" name="ReadValue_101173" type="ReadValue" version="opset6"> <data variable_id="past_key_values.9.valuepresent.9.value" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.9.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="16" name="Constant_99908" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="17" name="Gather_99909" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="18" name="Constant_90127_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="26" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="19" name="Constant_90127" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="20" name="Constant_90031_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="6170" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="21" name="Constant_90031" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="22" name="Constant_90030_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="23" name="Constant_90030" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="24" name="Constant_90028_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="25" name="Constant_90028" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="26" name="__module.model.model.layers.0.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="366"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="27" name="Constant_407" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="367"> <dim>1</dim> </port> </output> </layer> <layer id="28" name="__module.model.model.layers.0.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="368,variance.1"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="29" name="Constant_90029_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="30" name="Constant_90029" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="31" name="__module.model.model.layers.0.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="369"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="32" name="__module.model.model.layers.0.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="33" name="__module.model.model.layers.0.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="370"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="34" name="__module.model.model.layers.0.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="371,372,hidden_states.3,hidden_states.5"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="35" name="__module.model.model.layers.0.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="373,375,hidden_states.7"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="36" name="self.model.model.layers.0.self_attn.qkv_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="9216, 3072" offset="12328" size="56623104" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.0.self_attn.qkv_proj.weight"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="37" name="self.model.model.layers.0.self_attn.qkv_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="38" name="__module.model.model.layers.0.self_attn.qkv_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="382,qkv.1"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> </output> </layer> <layer id="39" name="Constant_450" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="40" name="Constant_452" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="41" name="Constant_454" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="42" name="__module.model.model.layers.0.self_attn/aten::slice/Reshape" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635448" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="43" name="__module.model.model.layers.0.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="383,query_states.1"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="44" name="Constant_96587" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="45" name="__module.model.model.layers.0.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="387"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="46" name="__module.model.model.layers.0.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="47" name="__module.model.model.layers.0.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="388,q.1"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="48" name="__module.model.model.layers.0.self_attn.rotary_emb/aten::unsqueeze/Unsqueeze_1_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 48, 1" offset="56635504" size="96" /> <output> <port id="0" precision="FP16" names="411,412"> <dim>1</dim> <dim>48</dim> <dim>1</dim> </port> </output> </layer> <layer id="49" name="__module.model.model.layers.0.self_attn.rotary_emb/aten::unsqueeze/Unsqueeze_1" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>48</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>48</dim> <dim>1</dim> </port> </output> </layer> <layer id="50" name="ShapeOf_93877" type="ShapeOf" version="opset3"> <data output_type="i64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="51" name="Constant_93878" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="52" name="Constant_93879" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="53" name="Gather_93880" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="I64"> <dim>3</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="I64" names="1060,1221,1382,1543,1704,1865,2026,2187,2348,2509,2670,2831,2992,311,3153,3314,345,3475,3636,3797,3958,4119,413,4280,4441,4602,4763,4924,5085,5246,5407,577,738,899"> <dim>1</dim> </port> </output> </layer> <layer id="54" name="Constant_80046" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="55" name="Constant_80048" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="56" name="__module.model.model.layers.0.self_attn.rotary_emb/prim::ListConstruct" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="3" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="57" name="__module.model.model.layers.0.self_attn.rotary_emb/aten::expand/Broadcast" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>48</dim> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="1062,1067,1223,1228,1384,1389,1545,1550,1706,1711,1867,1872,2028,2033,2189,2194,2350,2355,2511,2516,2672,2677,2833,2838,2994,2999,3155,3160,3316,3321,3477,3482,3638,3643,3799,3804,3960,3965,4121,4126,415,420,4282,4287,4443,4448,4604,4609,4765,4770,4926,4931,5087,5092,5248,5253,5409,5414,579,584,740,745,901,906,inv_freq_expanded,inv_freq_expanded.1,inv_freq_expanded.101,inv_freq_expanded.103,inv_freq_expanded.105,inv_freq_expanded.107,inv_freq_expanded.109,inv_freq_expanded.11,inv_freq_expanded.111,inv_freq_expanded.113,inv_freq_expanded.115,inv_freq_expanded.117,inv_freq_expanded.119,inv_freq_expanded.121,inv_freq_expanded.123,inv_freq_expanded.125,inv_freq_expanded.13,inv_freq_expanded.15,inv_freq_expanded.17,inv_freq_expanded.19,inv_freq_expanded.21,inv_freq_expanded.23,inv_freq_expanded.25,inv_freq_expanded.27,inv_freq_expanded.29,inv_freq_expanded.3,inv_freq_expanded.31,inv_freq_expanded.33,inv_freq_expanded.35,inv_freq_expanded.37,inv_freq_expanded.39,inv_freq_expanded.41,inv_freq_expanded.43,inv_freq_expanded.45,inv_freq_expanded.47,inv_freq_expanded.49,inv_freq_expanded.5,inv_freq_expanded.51,inv_freq_expanded.53,inv_freq_expanded.55,inv_freq_expanded.57,inv_freq_expanded.59,inv_freq_expanded.61,inv_freq_expanded.63,inv_freq_expanded.65,inv_freq_expanded.67,inv_freq_expanded.69,inv_freq_expanded.7,inv_freq_expanded.71,inv_freq_expanded.73,inv_freq_expanded.75,inv_freq_expanded.77,inv_freq_expanded.79,inv_freq_expanded.81,inv_freq_expanded.83,inv_freq_expanded.85,inv_freq_expanded.87,inv_freq_expanded.89,inv_freq_expanded.9,inv_freq_expanded.91,inv_freq_expanded.93,inv_freq_expanded.95,inv_freq_expanded.97,inv_freq_expanded.99"> <dim>-1</dim> <dim>48</dim> <dim>1</dim> </port> </output> </layer> <layer id="58" name="Constant_96586" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="56635600" size="16" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="59" name="__module.model.model/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="I64"> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="I64" names="1063,1224,1385,1546,1707,1868,2029,2190,2351,2512,2673,2834,2995,308,309,3156,3317,3478,3639,3800,3961,4122,416,4283,4444,4605,4766,4927,5088,5249,5410,580,741,902,position_ids"> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="60" name="202" type="Const" version="opset1"> <data element_type="i64" shape="" offset="56635440" size="8" /> <output> <port id="0" precision="I64" names="202" /> </output> </layer> <layer id="61" name="__module.model.model.layers.0.self_attn.rotary_emb/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="I64"> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="I64" names="1064,1065,1225,1226,1386,1387,1547,1548,1708,1709,1869,1870,2030,2031,2191,2192,2352,2353,2513,2514,2674,2675,2835,2836,2996,2997,3157,3158,3318,3319,3479,3480,3640,3641,3801,3802,3962,3963,4123,4124,417,418,4284,4285,4445,4446,4606,4607,4767,4768,4928,4929,5089,5090,5250,5251,5411,5412,581,582,742,743,903,904"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="62" name="__module.model.model.layers.0.self_attn.rotary_emb/aten::to/Convert_4" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="I64"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> </port> </input> <output> <port id="1" precision="FP32" names="1066,1068,1227,1229,1388,1390,1549,1551,1710,1712,1871,1873,2032,2034,2193,2195,2354,2356,2515,2517,2676,2678,2837,2839,2998,3000,3159,3161,3320,3322,3481,3483,3642,3644,3803,3805,3964,3966,4125,4127,419,421,4286,4288,4447,4449,4608,4610,4769,4771,4930,4932,5091,5093,5252,5254,5413,5415,583,585,744,746,905,907,position_ids_expanded,position_ids_expanded.1,position_ids_expanded.101,position_ids_expanded.103,position_ids_expanded.105,position_ids_expanded.107,position_ids_expanded.109,position_ids_expanded.11,position_ids_expanded.111,position_ids_expanded.113,position_ids_expanded.115,position_ids_expanded.117,position_ids_expanded.119,position_ids_expanded.121,position_ids_expanded.123,position_ids_expanded.125,position_ids_expanded.13,position_ids_expanded.15,position_ids_expanded.17,position_ids_expanded.19,position_ids_expanded.21,position_ids_expanded.23,position_ids_expanded.25,position_ids_expanded.27,position_ids_expanded.29,position_ids_expanded.3,position_ids_expanded.31,position_ids_expanded.33,position_ids_expanded.35,position_ids_expanded.37,position_ids_expanded.39,position_ids_expanded.41,position_ids_expanded.43,position_ids_expanded.45,position_ids_expanded.47,position_ids_expanded.49,position_ids_expanded.5,position_ids_expanded.51,position_ids_expanded.53,position_ids_expanded.55,position_ids_expanded.57,position_ids_expanded.59,position_ids_expanded.61,position_ids_expanded.63,position_ids_expanded.65,position_ids_expanded.67,position_ids_expanded.69,position_ids_expanded.7,position_ids_expanded.71,position_ids_expanded.73,position_ids_expanded.75,position_ids_expanded.77,position_ids_expanded.79,position_ids_expanded.81,position_ids_expanded.83,position_ids_expanded.85,position_ids_expanded.87,position_ids_expanded.89,position_ids_expanded.9,position_ids_expanded.91,position_ids_expanded.93,position_ids_expanded.95,position_ids_expanded.97,position_ids_expanded.99"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="63" name="__module.model.model.layers.0.self_attn.rotary_emb/aten::matmul/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>48</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1069,1230,1391,1552,1713,1874,2035,2196,2357,2518,2679,2840,3001,3162,3323,3484,3645,3806,3967,4128,422,4289,4450,4611,4772,4933,5094,5255,5416,586,747,908"> <dim>-1</dim> <dim>48</dim> <dim>-1</dim> </port> </output> </layer> <layer id="64" name="__module.model.model.layers.0.self_attn.rotary_emb/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="3" offset="56635616" size="12" /> <output> <port id="0" precision="I32"> <dim>3</dim> </port> </output> </layer> <layer id="65" name="__module.model.model.layers.0.self_attn.rotary_emb/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>48</dim> <dim>-1</dim> </port> <port id="1" precision="I32"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="1070,1231,1392,1553,1714,1875,2036,2197,2358,2519,2680,2841,3002,3163,3324,3485,3646,3807,3968,4129,423,4290,4451,4612,4773,4934,5095,5256,5417,587,748,909"> <dim>-1</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="66" name="__module.model.model.layers.0.self_attn.rotary_emb/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="1072,1233,1394,1555,1716,1877,2038,2199,2360,2521,2682,2843,3004,3165,3326,3487,3648,3809,3970,4131,425,4292,4453,4614,4775,4936,5097,5258,5419,589,750,911,emb,emb.1,emb.11,emb.13,emb.15,emb.17,emb.19,emb.21,emb.23,emb.25,emb.27,emb.29,emb.3,emb.31,emb.33,emb.35,emb.37,emb.39,emb.41,emb.43,emb.45,emb.47,emb.49,emb.5,emb.51,emb.53,emb.55,emb.57,emb.59,emb.61,emb.7,emb.9"> <dim>-1</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="67" name="__module.model.model.layers.0.self_attn.rotary_emb/aten::cos/Cos" type="Cos" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="1073,1234,1395,1556,1717,1878,2039,2200,2361,2522,2683,2844,3005,3166,3327,3488,3649,3810,3971,4132,426,4293,4454,4615,4776,4937,5098,5259,5420,590,751,912"> <dim>-1</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="68" name="Constant_90032_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="56635628" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="69" name="Constant_90032" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="70" name="__module.model.model.layers.0.self_attn.rotary_emb/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1074,1077,1080,1235,1238,1241,1396,1399,1402,1557,1560,1563,1718,1721,1724,1879,1882,1885,2040,2043,2046,2201,2204,2207,2362,2365,2368,2523,2526,2529,2684,2687,2690,2845,2848,2851,3006,3009,3012,3167,3170,3173,3328,3331,3334,3489,3492,3495,3650,3653,3656,3811,3814,3817,3972,3975,3978,4133,4136,4139,427,4294,4297,430,4300,433,4455,4458,4461,4616,4619,4622,4777,4780,4783,4938,4941,4944,5099,5102,5105,5260,5263,5266,5421,5424,5427,591,594,597,752,755,758,913,916,919,cos.1,cos.103,cos.105,cos.109,cos.111,cos.115,cos.117,cos.121,cos.123,cos.127,cos.129,cos.13,cos.133,cos.135,cos.139,cos.141,cos.145,cos.147,cos.15,cos.151,cos.153,cos.157,cos.159,cos.163,cos.165,cos.169,cos.171,cos.175,cos.177,cos.181,cos.183,cos.187,cos.189,cos.19,cos.21,cos.25,cos.27,cos.3,cos.31,cos.33,cos.37,cos.39,cos.43,cos.45,cos.49,cos.51,cos.55,cos.57,cos.61,cos.63,cos.67,cos.69,cos.7,cos.73,cos.75,cos.79,cos.81,cos.85,cos.87,cos.9,cos.91,cos.93,cos.97,cos.99"> <dim>-1</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="71" name="__module.model.model.layers.0.self_attn/aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="1082,1243,1404,1565,1726,1887,2048,2209,2370,2531,2692,2853,3014,3175,3336,3497,3658,3819,3980,4141,4302,435,4463,4624,4785,4946,5107,5268,5429,599,760,921,cos,cos.101,cos.107,cos.11,cos.113,cos.119,cos.125,cos.131,cos.137,cos.143,cos.149,cos.155,cos.161,cos.167,cos.17,cos.173,cos.179,cos.185,cos.23,cos.29,cos.35,cos.41,cos.47,cos.5,cos.53,cos.59,cos.65,cos.71,cos.77,cos.83,cos.89,cos.95"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="72" name="__module.model.model.layers.0.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="437"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="73" name="Constant_1017" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="74" name="Constant_1019" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="75" name="Constant_1021" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="76" name="__module.model.model.layers.0.self_attn/aten::slice/Reshape_1" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635646" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="77" name="__module.model.model.layers.0.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="447,x2.1"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="78" name="Constant_90033_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="79" name="Constant_90033" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="80" name="__module.model.model.layers.0.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="448"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="81" name="Constant_914" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="82" name="Constant_958" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="83" name="Constant_960" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="84" name="__module.model.model.layers.0.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="442"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="85" name="__module.model.model.layers.0.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="450"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="86" name="__module.model.model.layers.0.self_attn.rotary_emb/aten::sin/Sin" type="Sin" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="1075,1236,1397,1558,1719,1880,2041,2202,2363,2524,2685,2846,3007,3168,3329,3490,3651,3812,3973,4134,428,4295,4456,4617,4778,4939,5100,5261,5422,592,753,914"> <dim>-1</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="87" name="Constant_90034_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="56635628" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="88" name="Constant_90034" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="89" name="__module.model.model.layers.0.self_attn.rotary_emb/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1076,1078,1081,1237,1239,1242,1398,1400,1403,1559,1561,1564,1720,1722,1725,1881,1883,1886,2042,2044,2047,2203,2205,2208,2364,2366,2369,2525,2527,2530,2686,2688,2691,2847,2849,2852,3008,3010,3013,3169,3171,3174,3330,3332,3335,3491,3493,3496,3652,3654,3657,3813,3815,3818,3974,3976,3979,4135,4137,4140,429,4296,4298,4301,431,434,4457,4459,4462,4618,4620,4623,4779,4781,4784,4940,4942,4945,5101,5103,5106,5262,5264,5267,5423,5425,5428,593,595,598,754,756,759,915,917,920,sin.1,sin.103,sin.105,sin.109,sin.111,sin.115,sin.117,sin.121,sin.123,sin.127,sin.129,sin.13,sin.133,sin.135,sin.139,sin.141,sin.145,sin.147,sin.15,sin.151,sin.153,sin.157,sin.159,sin.163,sin.165,sin.169,sin.171,sin.175,sin.177,sin.181,sin.183,sin.187,sin.189,sin.19,sin.21,sin.25,sin.27,sin.3,sin.31,sin.33,sin.37,sin.39,sin.43,sin.45,sin.49,sin.51,sin.55,sin.57,sin.61,sin.63,sin.67,sin.69,sin.7,sin.73,sin.75,sin.79,sin.81,sin.85,sin.87,sin.9,sin.91,sin.93,sin.97,sin.99"> <dim>-1</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="90" name="__module.model.model.layers.0.self_attn/aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="1083,1244,1405,1566,1727,1888,2049,2210,2371,2532,2693,2854,3015,3176,3337,3498,3659,3820,3981,4142,4303,436,4464,4625,4786,4947,5108,5269,5430,600,761,922,sin,sin.101,sin.107,sin.11,sin.113,sin.119,sin.125,sin.131,sin.137,sin.143,sin.149,sin.155,sin.161,sin.167,sin.17,sin.173,sin.179,sin.185,sin.23,sin.29,sin.35,sin.41,sin.47,sin.5,sin.53,sin.59,sin.65,sin.71,sin.77,sin.83,sin.89,sin.95"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="91" name="__module.model.model.layers.0.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="451"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="92" name="__module.model.model.layers.0.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="452"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="93" name="Constant_102206_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="94" name="Constant_102206" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="95" name="Constant_102199" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="96" name="Constant_102201" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="97" name="Constant_102203" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="98" name="Concat_102204" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="99" name="Broadcast_102207" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="100" name="ReadValue_101047" type="ReadValue" version="opset6"> <data variable_id="past_key_values.0.keypresent.0.key" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.0.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="101" name="Constant_99851" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="102" name="Gather_99852" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="103" name="Constant_460" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="104" name="Constant_462" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="105" name="Constant_464" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="106" name="__module.model.model.layers.0.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="384,key_states.3"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="107" name="Constant_96588" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="108" name="__module.model.model.layers.0.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="390"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="109" name="__module.model.model.layers.0.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="110" name="__module.model.model.layers.0.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="391,key_states.5"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="111" name="__module.model.model.layers.0.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="453"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="112" name="Constant_1160" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="113" name="Constant_1162" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="114" name="Constant_1164" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="115" name="__module.model.model.layers.0.self_attn/aten::slice/Slice_4" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="463,x2.3"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="116" name="Constant_90035_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="117" name="Constant_90035" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="118" name="__module.model.model.layers.0.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="464"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="119" name="Constant_1057" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="120" name="Constant_1101" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="121" name="Constant_1103" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="122" name="__module.model.model.layers.0.self_attn/aten::slice/Slice_5" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="458"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="123" name="__module.model.model.layers.0.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="466"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="124" name="__module.model.model.layers.0.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="467"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="125" name="__module.model.model.layers.0.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="468,key_states.7"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="126" name="__module.model.model.layers.0.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.9,present.0.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="127" name="Constant_102218_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="128" name="Constant_102218" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="129" name="Constant_102211" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="130" name="Constant_102213" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="131" name="Constant_102215" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="132" name="Concat_102216" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="133" name="Broadcast_102219" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="134" name="ReadValue_101049" type="ReadValue" version="opset6"> <data variable_id="past_key_values.0.valuepresent.0.value" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.0.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="135" name="Constant_99854" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="136" name="Gather_99855" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="137" name="Constant_470" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="138" name="Constant_472" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="139" name="Constant_474" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="140" name="__module.model.model.layers.0.self_attn/aten::slice/Slice_6" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="385,value_states.1"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="141" name="Constant_96589" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="142" name="__module.model.model.layers.0.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="393"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="143" name="__module.model.model.layers.0.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="144" name="__module.model.model.layers.0.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="394"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="145" name="__module.model.model.layers.0.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.11,present.0.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="146" name="Constant_90037_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="147" name="Constant_90037" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="148" name="__module.model.model/aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="I64"> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="I64" names="348"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="149" name="203" type="Const" version="opset1"> <data element_type="i64" shape="" offset="56635448" size="8" /> <output> <port id="0" precision="I64" names="203" /> </output> </layer> <layer id="150" name="__module.model.model/aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="I64"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="I64" names="349,350"> <dim>-1</dim> <dim>1</dim> <dim>1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="151" name="Constant_80054" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="152" name="Constant_93868" type="Const" version="opset1"> <data element_type="i64" shape="" offset="56635440" size="8" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="153" name="Constant_93869" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="154" name="Gather_93870" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="I64"> <dim>3</dim> </port> <port id="1" precision="I64" /> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="I64" names="300,316,319" /> </output> </layer> <layer id="155" name="Constant_93871" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="156" name="Reshape_93872" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="I64" /> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="157" name="ShapeOf_93891" type="ShapeOf" version="opset3"> <data output_type="i64" /> <input> <port id="0" precision="I64"> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="1" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="158" name="Constant_93892" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="159" name="Constant_93893" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="160" name="Gather_93894" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="I64"> <dim>2</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="I64" names="346"> <dim>1</dim> </port> </output> </layer> <layer id="161" name="__module.model.model/prim::ListConstruct_1" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="162" name="__module.model.model/aten::expand/Broadcast" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="I64"> <dim>-1</dim> <dim>1</dim> <dim>1</dim> <dim>-1</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="I64" names="352"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="163" name="__module.model.model/aten::to/Convert_1" type="Convert" version="opset1"> <data destination_type="f32" /> <input> <port id="0" precision="I64"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="1" precision="FP32" names="353"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="164" name="Constant_90036_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="165" name="Constant_90036" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="166" name="__module.model.model/aten::rsub/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="167" name="__module.model.model/aten::rsub/Subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="2" precision="FP32" names="354,inverted_mask"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="168" name="__module.model.model/aten::to/Convert_2" type="Convert" version="opset1"> <data destination_type="boolean" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="1" precision="BOOL" names="355"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="169" name="210" type="Const" version="opset1"> <data element_type="f32" shape="" offset="56635664" size="4" /> <output> <port id="0" precision="FP32" names="210" /> </output> </layer> <layer id="170" name="__module.model.model/aten::masked_fill/Select" type="Select" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="BOOL"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32" /> <port id="2" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="3" precision="FP32" names="356,357,expanded_attn_mask"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="171" name="__module.model.model/aten::to/Convert_4" type="Convert" version="opset1"> <data destination_type="boolean" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="1" precision="BOOL" names="358"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="172" name="Constant_90039" type="Const" version="opset1"> <data element_type="i64" shape="1, 1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="173" name="__module.model.model/aten::triu/Constant" type="Const" version="opset1"> <data element_type="i32" shape="" offset="56635668" size="4" /> <output> <port id="0" precision="I32" /> </output> </layer> <layer id="174" name="__module.model.model/aten::zeros/Constant_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="175" name="__module.model.model/aten::zeros/Constant" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="176" name="ShapeOf_93899" type="ShapeOf" version="opset3"> <data output_type="i64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="177" name="Constant_93900" type="Const" version="opset1"> <data element_type="i64" shape="" offset="56635448" size="8" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="178" name="Constant_93901" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="179" name="Gather_93902" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="I64"> <dim>4</dim> </port> <port id="1" precision="I64" /> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="I64" names="305" /> </output> </layer> <layer id="180" name="__module.model.model/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="I64" /> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="I64" names="310,key_value_length" /> </output> </layer> <layer id="181" name="__module.model.model/aten::sub/Subtract" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="I64" /> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="I64" names="312,313,past_key_values_length" /> </output> </layer> <layer id="182" name="Constant_223" type="Const" version="opset1"> <data element_type="i32" shape="" offset="56635668" size="4" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I32" /> </output> </layer> <layer id="183" name="Unsqueeze_224" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="I64" /> <port id="1" precision="I32" /> </input> <output> <port id="2" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="184" name="__module.model.model/prim::ListConstruct_2" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="185" name="__module.model.model/aten::zeros/Broadcast" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP32" names="326"> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="186" name="ShapeOf_93917" type="ShapeOf" version="opset3"> <data output_type="i32" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="1" precision="I32"> <dim>2</dim> </port> </output> </layer> <layer id="187" name="Constant_93918" type="Const" version="opset1"> <data element_type="i64" shape="" offset="56635440" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="188" name="Constant_93919" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="189" name="Gather_93920" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="I32"> <dim>2</dim> </port> <port id="1" precision="I64" /> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="I32" /> </output> </layer> <layer id="190" name="Convert_93921" type="Convert" version="opset1"> <data destination_type="i32" /> <input> <port id="0" precision="I64" /> </input> <output> <port id="1" precision="I32" /> </output> </layer> <layer id="191" name="Add_93922" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="I32" /> <port id="1" precision="I32" /> </input> <output> <port id="2" precision="I32" /> </output> </layer> <layer id="192" name="__module.model.model/aten::triu/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="" offset="56635672" size="4" /> <output> <port id="0" precision="I32" /> </output> </layer> <layer id="193" name="__module.model.model/aten::triu/Range" type="Range" version="opset4"> <data output_type="i32" /> <input> <port id="0" precision="I32" /> <port id="1" precision="I32" /> <port id="2" precision="I32" /> </input> <output> <port id="3" precision="I32"> <dim>-1</dim> </port> </output> </layer> <layer id="194" name="__module.model.model/aten::triu/Unsqueeze" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="I32"> <dim>-1</dim> </port> <port id="1" precision="I32" /> </input> <output> <port id="2" precision="I32"> <dim>1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="195" name="Constant_88958" type="Const" version="opset1"> <data element_type="i64" shape="" offset="56635676" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="196" name="__module.model.model/aten::add/Add_2" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="I64" /> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="I64" names="330,331" /> </output> </layer> <layer id="197" name="__module.model.model/aten::triu/Convert" type="Convert" version="opset1"> <data destination_type="i32" /> <input> <port id="0" precision="I64" /> </input> <output> <port id="1" precision="I32" /> </output> </layer> <layer id="198" name="__module.model.model/aten::triu/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="I32" /> <port id="1" precision="I32" /> </input> <output> <port id="2" precision="I32" /> </output> </layer> <layer id="199" name="__module.model.model/aten::triu/Range_1" type="Range" version="opset4"> <data output_type="i32" /> <input> <port id="0" precision="I32" /> <port id="1" precision="I32" /> <port id="2" precision="I32" /> </input> <output> <port id="3" precision="I32"> <dim>-1</dim> </port> </output> </layer> <layer id="200" name="__module.model.model/aten::triu/Unsqueeze_1" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="I32"> <dim>-1</dim> </port> <port id="1" precision="I32" /> </input> <output> <port id="2" precision="I32"> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="201" name="__module.model.model/aten::triu/GreaterEqual" type="GreaterEqual" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="I32"> <dim>1</dim> <dim>-1</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="BOOL"> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="202" name="__module.model.model/aten::ones_like/Convert" type="Const" version="opset1"> <data element_type="i64" shape="" offset="56635440" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="203" name="__module.model.model/aten::arange/Constant" type="Const" version="opset1"> <data element_type="i32" shape="" offset="56635668" size="4" /> <output> <port id="0" precision="I32" /> </output> </layer> <layer id="204" name="__module.model.model/aten::arange/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="" offset="56635672" size="4" /> <output> <port id="0" precision="I32" /> </output> </layer> <layer id="205" name="__module.model.model/aten::arange/Range" type="Range" version="opset4"> <data output_type="f32" /> <input> <port id="0" precision="I32" /> <port id="1" precision="I64" /> <port id="2" precision="I32" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> </port> </output> </layer> <layer id="206" name="__module.model.model/aten::arange/ConvertLike" type="Convert" version="opset1"> <data destination_type="i64" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> </port> </input> <output> <port id="1" precision="I64" names="317,mask_cond"> <dim>-1</dim> </port> </output> </layer> <layer id="207" name="Constant_90038" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="208" name="__module.model.model/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="I64"> <dim>-1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="I64" names="318"> <dim>-1</dim> </port> </output> </layer> <layer id="209" name="Constant_96590" type="Const" version="opset1"> <data element_type="i64" shape="2" offset="56635684" size="16" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="210" name="__module.model.model/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="I64"> <dim>-1</dim> </port> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="I64" names="321"> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="211" name="__module.model.model/aten::lt/Less" type="Less" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="I64"> <dim>-1</dim> </port> <port id="1" precision="I64"> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="BOOL" names="322"> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="212" name="__module.model.model/aten::masked_fill_/ConvertLike_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="213" name="__module.model.model/aten::masked_fill_/ConvertLike" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="214" name="Constant_86585" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="56635700" size="4" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="215" name="__module.model.model/prim::ListConstruct_3" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="I64"> <dim>2</dim> </port> </output> </layer> <layer id="216" name="__module.model.model/aten::full/Broadcast" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>2</dim> </port> </input> <output> <port id="2" precision="FP32" names="315_1"> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="217" name="__module.model.model/aten::masked_fill_/Select" type="Select" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="BOOL"> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32" /> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="3" precision="FP32" names="315,324,mask.1"> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="218" name="__module.model.model/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="2" precision="FP32" names="328_1"> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="219" name="__module.model.model/aten::ones_like/ShapeOf" type="ShapeOf" version="opset3"> <data output_type="i32" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="1" precision="I32"> <dim>2</dim> </port> </output> </layer> <layer id="220" name="__module.model.model/aten::ones_like/Broadcast" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="I64" /> <port id="1" precision="I32"> <dim>2</dim> </port> </input> <output> <port id="2" precision="I64" names="332"> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="221" name="__module.model.model/aten::triu/ConvertLike" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="222" name="__module.model.model/aten::triu/Select" type="Select" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="BOOL"> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="I64"> <dim>-1</dim> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="I64" names="333"> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="223" name="__module.model.model/aten::rsub/Subtract_1" type="Subtract" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="I64"> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="2" precision="I64" names="334,context_mask"> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="224" name="__module.model.model/aten::to/Convert_6" type="Convert" version="opset1"> <data destination_type="boolean" /> <input> <port id="0" precision="I64"> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="1" precision="BOOL" names="335"> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="225" name="__module.model.model/aten::masked_fill_/Select_1" type="Select" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="BOOL"> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32" /> <port id="2" precision="FP32"> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="3" precision="FP32" names="328,mask.5"> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="226" name="209" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" names="209" /> </output> </layer> <layer id="227" name="__module.model.model/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="337"> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="228" name="__module.model.model/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="I64" /> </input> <output> <port id="2" precision="FP32" names="338,339,340"> <dim>1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="229" name="Constant_80068" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="230" name="__module.model.model/aten::add/Add_3" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="I64" names="341,342"> <dim>1</dim> </port> </output> </layer> <layer id="231" name="__module.model.model/prim::ListConstruct_5" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="232" name="__module.model.model/aten::expand/Broadcast_1" type="Broadcast" version="opset3"> <data mode="bidirectional" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="344,causal_4d_mask"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="233" name="__module.model.model/aten::masked_fill/Select_1" type="Select" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="BOOL"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="FP32" /> <port id="2" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="3" precision="FP32" names="1121,1122,1123,1282,1283,1284,1443,1444,1445,1604,1605,1606,1765,1766,1767,1926,1927,1928,2087,2088,2089,2248,2249,2250,2409,2410,2411,2570,2571,2572,2731,2732,2733,2892,2893,2894,3053,3054,3055,3214,3215,3216,3375,3376,3377,3536,3537,3538,359,3697,3698,3699,3858,3859,3860,4019,4020,4021,4180,4181,4182,4341,4342,4343,4502,4503,4504,4663,4664,4665,477,478,479,4824,4825,4826,4985,4986,4987,5146,5147,5148,5307,5308,5309,5468,5469,5470,638,639,640,799,800,801,960,961,962,attention_mask"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="234" name="Constant_1234" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="235" name="Constant_94002" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="236" name="Reshape_94003" type="Reshape" version="opset1"> <data special_zero="false" /> <input> <port id="0" precision="I64" /> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="237" name="Add_94006" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="I64" names="1120,1281,1442,1603,1764,1925,2086,2247,2408,2569,2730,2891,3052,3213,3374,3535,3696,3857,4018,4179,4340,4501,4662,476,4823,4984,5145,5306,5467,637,798,959"> <dim>1</dim> </port> </output> </layer> <layer id="238" name="Constant_1237" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="239" name="__module.model.model.layers.0.self_attn/aten::slice/Slice_10" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1124,1285,1446,1607,1768,1929,2090,2251,2412,2573,2734,2895,3056,3217,3378,3539,3700,3861,4022,4183,4344,4505,4666,480,4827,4988,5149,5310,5471,641,802,963"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </output> </layer> <layer id="240" name="__module.model.model.layers.0.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="481,attn_output.1"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="241" name="__module.model.model.layers.0.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="242" name="__module.model.model.layers.0.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="482"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="243" name="Constant_96591" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="56635704" size="24" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="244" name="__module.model.model.layers.0.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="485"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="245" name="self.model.model.layers.0.self_attn.o_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 3072" offset="56635728" size="18874368" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.0.self_attn.o_proj.weight"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="246" name="self.model.model.layers.0.self_attn.o_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="247" name="__module.model.model.layers.0.self_attn.o_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="487,489,input.1"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="248" name="__module.model.model.layers.0/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="493,495,506,hidden_states.13,hidden_states.15"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="249" name="Constant_90043_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="75510096" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="250" name="Constant_90043" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="251" name="Constant_90042_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="252" name="Constant_90042" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="253" name="Constant_90040_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="254" name="Constant_90040" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="255" name="__module.model.model.layers.0.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="496"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="256" name="Constant_1338" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="497"> <dim>1</dim> </port> </output> </layer> <layer id="257" name="__module.model.model.layers.0.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="498,variance.3"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="258" name="Constant_90041_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="259" name="Constant_90041" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="260" name="__module.model.model.layers.0.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="499"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="261" name="__module.model.model.layers.0.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="262" name="__module.model.model.layers.0.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="500"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="263" name="__module.model.model.layers.0.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="501,502,hidden_states.17,hidden_states.19"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="264" name="__module.model.model.layers.0.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="503,505"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="265" name="self.model.model.layers.0.mlp.gate_up_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="16384, 3072" offset="75516240" size="100663296" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.0.mlp.gate_up_proj.weight"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="266" name="self.model.model.layers.0.mlp.gate_up_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="267" name="__module.model.model.layers.0.mlp.gate_up_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="510,up_states.1"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> </output> </layer> <layer id="268" name="205" type="Const" version="opset1"> <data element_type="i64" shape="" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="205" /> </output> </layer> <layer id="269" name="__module.model.model.layers.0.mlp/prim::ListUnpack/ShapeOf" type="ShapeOf" version="opset3"> <data output_type="i32" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> </input> <output> <port id="1" precision="I32"> <dim>3</dim> </port> </output> </layer> <layer id="270" name="Constant_35107" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="56635668" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="271" name="__module.model.model.layers.0.mlp/prim::ListUnpack/Gather" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="I32"> <dim>3</dim> </port> <port id="1" precision="I64" /> <port id="2" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="3" precision="I32" /> </output> </layer> <layer id="272" name="__module.model.model.layers.0.mlp/prim::ListUnpack/Convert" type="Const" version="opset1"> <data element_type="i32" shape="" offset="56635700" size="4" /> <output> <port id="0" precision="I32" /> </output> </layer> <layer id="273" name="__module.model.model.layers.0.mlp/prim::ListUnpack/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="I32" /> <port id="1" precision="I32" /> </input> <output> <port id="2" precision="I32" /> </output> </layer> <layer id="274" name="__module.model.model.layers.0.mlp/prim::ListUnpack/Mod" type="Mod" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="I32" /> <port id="1" precision="I32" /> </input> <output> <port id="2" precision="I32" /> </output> </layer> <layer id="275" name="__module.model.model.layers.0.mlp/prim::ListUnpack/Greater" type="Greater" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="I32" /> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="BOOL"> <dim>1</dim> </port> </output> </layer> <layer id="276" name="__module.model.model.layers.0.mlp/prim::ListUnpack/Convert_0" type="Convert" version="opset1"> <data destination_type="i32" /> <input> <port id="0" precision="BOOL"> <dim>1</dim> </port> </input> <output> <port id="1" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="277" name="__module.model.model.layers.0.mlp/prim::ListUnpack/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="I32" /> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="278" name="Constant_35108" type="Const" version="opset1"> <data element_type="i32" shape="1" offset="176179536" size="4" /> <output> <port id="0" precision="I32"> <dim>1</dim> </port> </output> </layer> <layer id="279" name="__module.model.model.layers.0.mlp/prim::ListUnpack/Concat" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I32"> <dim>1</dim> </port> <port id="1" precision="I32"> <dim>1</dim> </port> </input> <output> <port id="2" precision="I32"> <dim>2</dim> </port> </output> </layer> <layer id="280" name="__module.model.model.layers.0.mlp/prim::ListUnpack/VariadicSplit" type="VariadicSplit" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> <port id="1" precision="I64" /> <port id="2" precision="I32"> <dim>2</dim> </port> </input> <output> <port id="3" precision="FP32" names="512,input.3"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="4" precision="FP32" names="513,up_states.3"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="281" name="__module.model.model.layers.0.mlp.activation_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32" names="514"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="282" name="__module.model.model.layers.0.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="515"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="283" name="self.model.model.layers.0.mlp.down_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 8192" offset="176179540" size="50331648" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.0.mlp.down_proj.weight"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="284" name="self.model.model.layers.0.mlp.down_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="285" name="__module.model.model.layers.0.mlp.down_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="517,input.5"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="286" name="__module.model.model.layers.0/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="519,521,529,540,hidden_states.23,hidden_states.25"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="287" name="Constant_90047_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="226511188" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="288" name="Constant_90047" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="289" name="Constant_90046_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="290" name="Constant_90046" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="291" name="Constant_90044_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="292" name="Constant_90044" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="293" name="__module.model.model.layers.1.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="530"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="294" name="Constant_1407" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="531"> <dim>1</dim> </port> </output> </layer> <layer id="295" name="__module.model.model.layers.1.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="532,variance.5"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="296" name="Constant_90045_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="297" name="Constant_90045" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="298" name="__module.model.model.layers.1.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="533"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="299" name="__module.model.model.layers.1.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="300" name="__module.model.model.layers.1.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="534"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="301" name="__module.model.model.layers.1.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="535,536,hidden_states.27,hidden_states.29"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="302" name="__module.model.model.layers.1.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="537,539,hidden_states.31"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="303" name="self.model.model.layers.1.self_attn.qkv_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="9216, 3072" offset="226517332" size="56623104" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.1.self_attn.qkv_proj.weight"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="304" name="self.model.model.layers.1.self_attn.qkv_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="305" name="__module.model.model.layers.1.self_attn.qkv_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="546,qkv.3"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> </output> </layer> <layer id="306" name="Constant_1450" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="307" name="Constant_1452" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="308" name="Constant_1454" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="309" name="__module.model.model.layers.1.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="547,query_states.3"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="310" name="Constant_96592" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="311" name="__module.model.model.layers.1.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="551"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="312" name="__module.model.model.layers.1.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="313" name="__module.model.model.layers.1.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="552,q.3"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="314" name="__module.model.model.layers.1.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="601"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="315" name="Constant_2017" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="316" name="Constant_2019" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="317" name="Constant_2021" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="318" name="__module.model.model.layers.1.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="611,x2.5"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="319" name="Constant_90048_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="320" name="Constant_90048" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="321" name="__module.model.model.layers.1.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="612"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="322" name="Constant_1914" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="323" name="Constant_1958" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="324" name="Constant_1960" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="325" name="__module.model.model.layers.1.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="606"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="326" name="__module.model.model.layers.1.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="614"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="327" name="__module.model.model.layers.1.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="615"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="328" name="__module.model.model.layers.1.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="616"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="329" name="Constant_102242_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="330" name="Constant_102242" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="331" name="Constant_102235" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="332" name="Constant_102237" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="333" name="Constant_102239" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="334" name="Concat_102240" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="335" name="Broadcast_102243" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="336" name="ReadValue_101051" type="ReadValue" version="opset6"> <data variable_id="past_key_values.1.keypresent.1.key" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.1.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="337" name="Constant_99857" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="338" name="Gather_99858" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="339" name="Constant_1460" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="340" name="Constant_1462" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="341" name="Constant_1464" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="342" name="__module.model.model.layers.1.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="548,key_states.9"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="343" name="Constant_96593" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="344" name="__module.model.model.layers.1.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="554"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="345" name="__module.model.model.layers.1.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="346" name="__module.model.model.layers.1.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="555,key_states.11"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="347" name="__module.model.model.layers.1.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="617"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="348" name="Constant_2160" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="349" name="Constant_2162" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="350" name="Constant_2164" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="351" name="__module.model.model.layers.1.self_attn/aten::slice/Slice_4" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="627,x2.7"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="352" name="Constant_90049_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="353" name="Constant_90049" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="354" name="__module.model.model.layers.1.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="628"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="355" name="Constant_2057" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="356" name="Constant_2101" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="357" name="Constant_2103" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="358" name="__module.model.model.layers.1.self_attn/aten::slice/Slice_5" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="622"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="359" name="__module.model.model.layers.1.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="630"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="360" name="__module.model.model.layers.1.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="631"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="361" name="__module.model.model.layers.1.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="632"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="362" name="__module.model.model.layers.1.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.33,present.1.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="363" name="Constant_102230_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="364" name="Constant_102230" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="365" name="Constant_102223" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="366" name="Constant_102225" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="367" name="Constant_102227" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="368" name="Concat_102228" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="369" name="Broadcast_102231" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="370" name="ReadValue_101053" type="ReadValue" version="opset6"> <data variable_id="past_key_values.1.valuepresent.1.value" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.1.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="371" name="Constant_99860" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="372" name="Gather_99861" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="373" name="Constant_1470" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="374" name="Constant_1472" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="375" name="Constant_1474" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="376" name="__module.model.model.layers.1.self_attn/aten::slice/Slice_6" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="549,value_states.3"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="377" name="Constant_96594" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="378" name="__module.model.model.layers.1.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="557"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="379" name="__module.model.model.layers.1.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="380" name="__module.model.model.layers.1.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="558"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="381" name="__module.model.model.layers.1.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.35,present.1.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="382" name="__module.model.model.layers.1.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="642,attn_output.5"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="383" name="__module.model.model.layers.1.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="384" name="__module.model.model.layers.1.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="643"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="385" name="Constant_96595" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="56635704" size="24" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="386" name="__module.model.model.layers.1.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="646"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="387" name="self.model.model.layers.1.self_attn.o_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 3072" offset="283140436" size="18874368" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.1.self_attn.o_proj.weight"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="388" name="self.model.model.layers.1.self_attn.o_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="389" name="__module.model.model.layers.1.self_attn.o_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="648,650,input.7"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="390" name="__module.model.model.layers.1/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="654,656,667,hidden_states.37,hidden_states.39"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="391" name="Constant_90053_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="302014804" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="392" name="Constant_90053" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="393" name="Constant_90052_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="394" name="Constant_90052" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="395" name="Constant_90050_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="396" name="Constant_90050" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="397" name="__module.model.model.layers.1.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="657"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="398" name="Constant_2332" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="658"> <dim>1</dim> </port> </output> </layer> <layer id="399" name="__module.model.model.layers.1.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="659,variance.7"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="400" name="Constant_90051_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="401" name="Constant_90051" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="402" name="__module.model.model.layers.1.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="660"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="403" name="__module.model.model.layers.1.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="404" name="__module.model.model.layers.1.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="661"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="405" name="__module.model.model.layers.1.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="662,663,hidden_states.41,hidden_states.43"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="406" name="__module.model.model.layers.1.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="664,666"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="407" name="self.model.model.layers.1.mlp.gate_up_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="16384, 3072" offset="302020948" size="100663296" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.1.mlp.gate_up_proj.weight"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="408" name="self.model.model.layers.1.mlp.gate_up_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="409" name="__module.model.model.layers.1.mlp.gate_up_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="671,up_states.5"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> </output> </layer> <layer id="410" name="__module.model.model.layers.1.mlp/prim::ListUnpack/VariadicSplit" type="VariadicSplit" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> <port id="1" precision="I64" /> <port id="2" precision="I32"> <dim>2</dim> </port> </input> <output> <port id="3" precision="FP32" names="673,input.9"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="4" precision="FP32" names="674,up_states.7"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="411" name="__module.model.model.layers.1.mlp.activation_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32" names="675"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="412" name="__module.model.model.layers.1.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="676"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="413" name="self.model.model.layers.1.mlp.down_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 8192" offset="402684244" size="50331648" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.1.mlp.down_proj.weight"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="414" name="self.model.model.layers.1.mlp.down_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="415" name="__module.model.model.layers.1.mlp.down_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="678,input.11"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="416" name="__module.model.model.layers.1/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="680,682,690,701,hidden_states.47,hidden_states.49"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="417" name="Constant_90057_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="453015892" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="418" name="Constant_90057" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="419" name="Constant_90056_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="420" name="Constant_90056" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="421" name="Constant_90054_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="422" name="Constant_90054" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="423" name="__module.model.model.layers.2.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="691"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="424" name="Constant_2401" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="692"> <dim>1</dim> </port> </output> </layer> <layer id="425" name="__module.model.model.layers.2.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="693,variance.9"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="426" name="Constant_90055_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="427" name="Constant_90055" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="428" name="__module.model.model.layers.2.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="694"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="429" name="__module.model.model.layers.2.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="430" name="__module.model.model.layers.2.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="695"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="431" name="__module.model.model.layers.2.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="696,697,hidden_states.51,hidden_states.53"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="432" name="__module.model.model.layers.2.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="698,700,hidden_states.55"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="433" name="self.model.model.layers.2.self_attn.qkv_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="9216, 3072" offset="453022036" size="56623104" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.2.self_attn.qkv_proj.weight"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="434" name="self.model.model.layers.2.self_attn.qkv_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="435" name="__module.model.model.layers.2.self_attn.qkv_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="707,qkv.5"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> </output> </layer> <layer id="436" name="Constant_2444" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="437" name="Constant_2446" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="438" name="Constant_2448" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="439" name="__module.model.model.layers.2.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="708,query_states.5"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="440" name="Constant_96596" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="441" name="__module.model.model.layers.2.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="712"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="442" name="__module.model.model.layers.2.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="443" name="__module.model.model.layers.2.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="713,q.5"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="444" name="__module.model.model.layers.2.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="762"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="445" name="Constant_3011" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="446" name="Constant_3013" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="447" name="Constant_3015" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="448" name="__module.model.model.layers.2.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="772,x2.9"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="449" name="Constant_90058_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="450" name="Constant_90058" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="451" name="__module.model.model.layers.2.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="773"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="452" name="Constant_2908" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="453" name="Constant_2952" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="454" name="Constant_2954" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="455" name="__module.model.model.layers.2.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="767"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="456" name="__module.model.model.layers.2.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="775"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="457" name="__module.model.model.layers.2.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="776"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="458" name="__module.model.model.layers.2.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="777"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="459" name="Constant_102266_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="460" name="Constant_102266" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="461" name="Constant_102259" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="462" name="Constant_102261" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="463" name="Constant_102263" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="464" name="Concat_102264" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="465" name="Broadcast_102267" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="466" name="ReadValue_101095" type="ReadValue" version="opset6"> <data variable_id="past_key_values.2.keypresent.2.key" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.2.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="467" name="Constant_99863" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="468" name="Gather_99864" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="469" name="Constant_2454" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="470" name="Constant_2456" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="471" name="Constant_2458" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="472" name="__module.model.model.layers.2.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="709,key_states.13"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="473" name="Constant_96597" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="474" name="__module.model.model.layers.2.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="715"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="475" name="__module.model.model.layers.2.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="476" name="__module.model.model.layers.2.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="716,key_states.15"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="477" name="__module.model.model.layers.2.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="778"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="478" name="Constant_3154" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="479" name="Constant_3156" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="480" name="Constant_3158" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="481" name="__module.model.model.layers.2.self_attn/aten::slice/Slice_4" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="788,x2.11"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="482" name="Constant_90059_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="483" name="Constant_90059" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="484" name="__module.model.model.layers.2.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="789"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="485" name="Constant_3051" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="486" name="Constant_3095" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="487" name="Constant_3097" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="488" name="__module.model.model.layers.2.self_attn/aten::slice/Slice_5" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="783"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="489" name="__module.model.model.layers.2.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="791"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="490" name="__module.model.model.layers.2.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="792"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="491" name="__module.model.model.layers.2.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="793"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="492" name="__module.model.model.layers.2.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.57,present.2.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="493" name="Constant_102254_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="494" name="Constant_102254" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="495" name="Constant_102247" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="496" name="Constant_102249" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="497" name="Constant_102251" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="498" name="Concat_102252" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="499" name="Broadcast_102255" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="500" name="ReadValue_101097" type="ReadValue" version="opset6"> <data variable_id="past_key_values.2.valuepresent.2.value" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.2.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="501" name="Constant_99866" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="502" name="Gather_99867" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="503" name="Constant_2464" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="504" name="Constant_2466" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="505" name="Constant_2468" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="506" name="__module.model.model.layers.2.self_attn/aten::slice/Slice_6" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="710,value_states.5"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="507" name="Constant_96598" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="508" name="__module.model.model.layers.2.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="718"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="509" name="__module.model.model.layers.2.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="510" name="__module.model.model.layers.2.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="719"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="511" name="__module.model.model.layers.2.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.59,present.2.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="512" name="__module.model.model.layers.2.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="803,attn_output.9"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="513" name="__module.model.model.layers.2.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="514" name="__module.model.model.layers.2.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="804"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="515" name="Constant_96599" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="56635704" size="24" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="516" name="__module.model.model.layers.2.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="807"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="517" name="self.model.model.layers.2.self_attn.o_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 3072" offset="509645140" size="18874368" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.2.self_attn.o_proj.weight"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="518" name="self.model.model.layers.2.self_attn.o_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="519" name="__module.model.model.layers.2.self_attn.o_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="809,811,input.13"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="520" name="__module.model.model.layers.2/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="815,817,828,hidden_states.61,hidden_states.63"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="521" name="Constant_90063_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="528519508" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="522" name="Constant_90063" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="523" name="Constant_90062_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="524" name="Constant_90062" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="525" name="Constant_90060_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="526" name="Constant_90060" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="527" name="__module.model.model.layers.2.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="818"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="528" name="Constant_3326" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="819"> <dim>1</dim> </port> </output> </layer> <layer id="529" name="__module.model.model.layers.2.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="820,variance.11"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="530" name="Constant_90061_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="531" name="Constant_90061" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="532" name="__module.model.model.layers.2.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="821"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="533" name="__module.model.model.layers.2.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="534" name="__module.model.model.layers.2.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="822"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="535" name="__module.model.model.layers.2.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="823,824,hidden_states.65,hidden_states.67"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="536" name="__module.model.model.layers.2.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="825,827"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="537" name="self.model.model.layers.2.mlp.gate_up_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="16384, 3072" offset="528525652" size="100663296" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.2.mlp.gate_up_proj.weight"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="538" name="self.model.model.layers.2.mlp.gate_up_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="539" name="__module.model.model.layers.2.mlp.gate_up_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="832,up_states.9"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> </output> </layer> <layer id="540" name="__module.model.model.layers.2.mlp/prim::ListUnpack/VariadicSplit" type="VariadicSplit" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> <port id="1" precision="I64" /> <port id="2" precision="I32"> <dim>2</dim> </port> </input> <output> <port id="3" precision="FP32" names="834,input.15"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="4" precision="FP32" names="835,up_states.11"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="541" name="__module.model.model.layers.2.mlp.activation_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32" names="836"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="542" name="__module.model.model.layers.2.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="837"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="543" name="self.model.model.layers.2.mlp.down_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 8192" offset="629188948" size="50331648" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.2.mlp.down_proj.weight"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="544" name="self.model.model.layers.2.mlp.down_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="545" name="__module.model.model.layers.2.mlp.down_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="839,input.17"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="546" name="__module.model.model.layers.2/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="841,843,851,862,hidden_states.71,hidden_states.73"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="547" name="Constant_90067_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="679520596" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="548" name="Constant_90067" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="549" name="Constant_90066_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="550" name="Constant_90066" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="551" name="Constant_90064_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="552" name="Constant_90064" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="553" name="__module.model.model.layers.3.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="852"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="554" name="Constant_3395" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="853"> <dim>1</dim> </port> </output> </layer> <layer id="555" name="__module.model.model.layers.3.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="854,variance.13"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="556" name="Constant_90065_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="557" name="Constant_90065" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="558" name="__module.model.model.layers.3.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="855"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="559" name="__module.model.model.layers.3.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="560" name="__module.model.model.layers.3.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="856"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="561" name="__module.model.model.layers.3.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="857,858,hidden_states.75,hidden_states.77"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="562" name="__module.model.model.layers.3.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="859,861,hidden_states.79"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="563" name="self.model.model.layers.3.self_attn.qkv_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="9216, 3072" offset="679526740" size="56623104" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.3.self_attn.qkv_proj.weight"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="564" name="self.model.model.layers.3.self_attn.qkv_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="565" name="__module.model.model.layers.3.self_attn.qkv_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="868,qkv.7"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> </output> </layer> <layer id="566" name="Constant_3438" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="567" name="Constant_3440" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="568" name="Constant_3442" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="569" name="__module.model.model.layers.3.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="869,query_states.7"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="570" name="Constant_96600" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="571" name="__module.model.model.layers.3.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="873"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="572" name="__module.model.model.layers.3.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="573" name="__module.model.model.layers.3.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="874,q.7"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="574" name="__module.model.model.layers.3.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="923"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="575" name="Constant_4005" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="576" name="Constant_4007" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="577" name="Constant_4009" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="578" name="__module.model.model.layers.3.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="933,x2.13"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="579" name="Constant_90068_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="580" name="Constant_90068" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="581" name="__module.model.model.layers.3.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="934"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="582" name="Constant_3902" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="583" name="Constant_3946" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="584" name="Constant_3948" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="585" name="__module.model.model.layers.3.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="928"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="586" name="__module.model.model.layers.3.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="936"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="587" name="__module.model.model.layers.3.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="937"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="588" name="__module.model.model.layers.3.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="938"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="589" name="Constant_102290_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="590" name="Constant_102290" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="591" name="Constant_102283" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="592" name="Constant_102285" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="593" name="Constant_102287" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="594" name="Concat_102288" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="595" name="Broadcast_102291" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="596" name="ReadValue_101139" type="ReadValue" version="opset6"> <data variable_id="past_key_values.3.keypresent.3.key" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.3.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="597" name="Constant_99869" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="598" name="Gather_99870" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="599" name="Constant_3448" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="600" name="Constant_3450" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="601" name="Constant_3452" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="602" name="__module.model.model.layers.3.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="870,key_states.17"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="603" name="Constant_96601" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="604" name="__module.model.model.layers.3.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="876"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="605" name="__module.model.model.layers.3.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="606" name="__module.model.model.layers.3.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="877,key_states.19"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="607" name="__module.model.model.layers.3.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="939"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="608" name="Constant_4148" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="609" name="Constant_4150" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="610" name="Constant_4152" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="611" name="__module.model.model.layers.3.self_attn/aten::slice/Slice_4" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="949,x2.15"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="612" name="Constant_90069_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="613" name="Constant_90069" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="614" name="__module.model.model.layers.3.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="950"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="615" name="Constant_4045" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="616" name="Constant_4089" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="617" name="Constant_4091" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="618" name="__module.model.model.layers.3.self_attn/aten::slice/Slice_5" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="944"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="619" name="__module.model.model.layers.3.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="952"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="620" name="__module.model.model.layers.3.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="953"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="621" name="__module.model.model.layers.3.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="954"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="622" name="__module.model.model.layers.3.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.81,present.3.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="623" name="Constant_102278_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="624" name="Constant_102278" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="625" name="Constant_102271" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="626" name="Constant_102273" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="627" name="Constant_102275" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="628" name="Concat_102276" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="629" name="Broadcast_102279" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="630" name="ReadValue_101141" type="ReadValue" version="opset6"> <data variable_id="past_key_values.3.valuepresent.3.value" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.3.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="631" name="Constant_99872" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="632" name="Gather_99873" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="633" name="Constant_3458" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="634" name="Constant_3460" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="635" name="Constant_3462" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="636" name="__module.model.model.layers.3.self_attn/aten::slice/Slice_6" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="871,value_states.7"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="637" name="Constant_96602" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="638" name="__module.model.model.layers.3.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="879"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="639" name="__module.model.model.layers.3.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="640" name="__module.model.model.layers.3.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="880"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="641" name="__module.model.model.layers.3.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.83,present.3.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="642" name="__module.model.model.layers.3.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="964,attn_output.13"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="643" name="__module.model.model.layers.3.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="644" name="__module.model.model.layers.3.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="965"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="645" name="Constant_96603" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="56635704" size="24" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="646" name="__module.model.model.layers.3.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="968"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="647" name="self.model.model.layers.3.self_attn.o_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 3072" offset="736149844" size="18874368" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.3.self_attn.o_proj.weight"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="648" name="self.model.model.layers.3.self_attn.o_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="649" name="__module.model.model.layers.3.self_attn.o_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="970,972,input.19"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="650" name="__module.model.model.layers.3/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="976,978,989,hidden_states.85,hidden_states.87"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="651" name="Constant_90073_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="755024212" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="652" name="Constant_90073" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="653" name="Constant_90072_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="654" name="Constant_90072" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="655" name="Constant_90070_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="656" name="Constant_90070" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="657" name="__module.model.model.layers.3.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="979"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="658" name="Constant_4320" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="980"> <dim>1</dim> </port> </output> </layer> <layer id="659" name="__module.model.model.layers.3.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="981,variance.15"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="660" name="Constant_90071_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="661" name="Constant_90071" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="662" name="__module.model.model.layers.3.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="982"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="663" name="__module.model.model.layers.3.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="664" name="__module.model.model.layers.3.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="983"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="665" name="__module.model.model.layers.3.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="984,985,hidden_states.89,hidden_states.91"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="666" name="__module.model.model.layers.3.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="986,988"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="667" name="self.model.model.layers.3.mlp.gate_up_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="16384, 3072" offset="755030356" size="100663296" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.3.mlp.gate_up_proj.weight"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="668" name="self.model.model.layers.3.mlp.gate_up_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="669" name="__module.model.model.layers.3.mlp.gate_up_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="993,up_states.13"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> </output> </layer> <layer id="670" name="__module.model.model.layers.3.mlp/prim::ListUnpack/VariadicSplit" type="VariadicSplit" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> <port id="1" precision="I64" /> <port id="2" precision="I32"> <dim>2</dim> </port> </input> <output> <port id="3" precision="FP32" names="995,input.21"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="4" precision="FP32" names="996,up_states.15"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="671" name="__module.model.model.layers.3.mlp.activation_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32" names="997"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="672" name="__module.model.model.layers.3.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="998"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="673" name="self.model.model.layers.3.mlp.down_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 8192" offset="855693652" size="50331648" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.3.mlp.down_proj.weight"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="674" name="self.model.model.layers.3.mlp.down_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="675" name="__module.model.model.layers.3.mlp.down_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="1000,input.23"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="676" name="__module.model.model.layers.3/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1002,1004,1012,1023,hidden_states.95,hidden_states.97"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="677" name="Constant_90077_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="906025300" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="678" name="Constant_90077" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="679" name="Constant_90076_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="680" name="Constant_90076" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="681" name="Constant_90074_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="682" name="Constant_90074" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="683" name="__module.model.model.layers.4.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1013"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="684" name="Constant_4389" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="1014"> <dim>1</dim> </port> </output> </layer> <layer id="685" name="__module.model.model.layers.4.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1015,variance.17"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="686" name="Constant_90075_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="687" name="Constant_90075" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="688" name="__module.model.model.layers.4.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1016"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="689" name="__module.model.model.layers.4.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="690" name="__module.model.model.layers.4.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1017"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="691" name="__module.model.model.layers.4.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1018,1019,hidden_states.101,hidden_states.99"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="692" name="__module.model.model.layers.4.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1020,1022,hidden_states.103"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="693" name="self.model.model.layers.4.self_attn.qkv_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="9216, 3072" offset="906031444" size="56623104" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.4.self_attn.qkv_proj.weight"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="694" name="self.model.model.layers.4.self_attn.qkv_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="695" name="__module.model.model.layers.4.self_attn.qkv_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1029,qkv.9"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> </output> </layer> <layer id="696" name="Constant_4432" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="697" name="Constant_4434" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="698" name="Constant_4436" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="699" name="__module.model.model.layers.4.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1030,query_states.9"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="700" name="Constant_96604" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="701" name="__module.model.model.layers.4.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1034"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="702" name="__module.model.model.layers.4.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="703" name="__module.model.model.layers.4.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1035,q.9"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="704" name="__module.model.model.layers.4.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="1084"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="705" name="Constant_4999" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="706" name="Constant_5001" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="707" name="Constant_5003" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="708" name="__module.model.model.layers.4.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1094,x2.17"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="709" name="Constant_90078_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="710" name="Constant_90078" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="711" name="__module.model.model.layers.4.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1095"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="712" name="Constant_4896" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="713" name="Constant_4940" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="714" name="Constant_4942" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="715" name="__module.model.model.layers.4.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1089"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="716" name="__module.model.model.layers.4.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="1097"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="717" name="__module.model.model.layers.4.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="1098"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="718" name="__module.model.model.layers.4.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="1099"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="719" name="Constant_102314_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="720" name="Constant_102314" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="721" name="Constant_102307" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="722" name="Constant_102309" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="723" name="Constant_102311" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="724" name="Concat_102312" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="725" name="Broadcast_102315" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="726" name="ReadValue_101151" type="ReadValue" version="opset6"> <data variable_id="past_key_values.4.keypresent.4.key" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.4.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="727" name="Constant_99875" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="728" name="Gather_99876" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="729" name="Constant_4442" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="730" name="Constant_4444" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="731" name="Constant_4446" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="732" name="__module.model.model.layers.4.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1031,key_states.21"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="733" name="Constant_96605" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="734" name="__module.model.model.layers.4.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1037"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="735" name="__module.model.model.layers.4.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="736" name="__module.model.model.layers.4.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1038,key_states.23"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="737" name="__module.model.model.layers.4.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="1100"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="738" name="Constant_5142" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="739" name="Constant_5144" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="740" name="Constant_5146" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="741" name="__module.model.model.layers.4.self_attn/aten::slice/Slice_4" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1110,x2.19"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="742" name="Constant_90079_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="743" name="Constant_90079" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="744" name="__module.model.model.layers.4.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1111"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="745" name="Constant_5039" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="746" name="Constant_5083" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="747" name="Constant_5085" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="748" name="__module.model.model.layers.4.self_attn/aten::slice/Slice_5" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1105"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="749" name="__module.model.model.layers.4.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="1113"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="750" name="__module.model.model.layers.4.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="1114"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="751" name="__module.model.model.layers.4.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="1115"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="752" name="__module.model.model.layers.4.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.105,present.4.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="753" name="Constant_102302_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="754" name="Constant_102302" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="755" name="Constant_102295" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="756" name="Constant_102297" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="757" name="Constant_102299" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="758" name="Concat_102300" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="759" name="Broadcast_102303" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="760" name="ReadValue_101153" type="ReadValue" version="opset6"> <data variable_id="past_key_values.4.valuepresent.4.value" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.4.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="761" name="Constant_99878" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="762" name="Gather_99879" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="763" name="Constant_4452" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="764" name="Constant_4454" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="765" name="Constant_4456" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="766" name="__module.model.model.layers.4.self_attn/aten::slice/Slice_6" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1032,value_states.9"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="767" name="Constant_96606" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="768" name="__module.model.model.layers.4.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1040"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="769" name="__module.model.model.layers.4.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="770" name="__module.model.model.layers.4.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1041"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="771" name="__module.model.model.layers.4.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.107,present.4.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="772" name="__module.model.model.layers.4.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="1125,attn_output.17"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="773" name="__module.model.model.layers.4.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="774" name="__module.model.model.layers.4.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1126"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="775" name="Constant_96607" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="56635704" size="24" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="776" name="__module.model.model.layers.4.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="1129"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="777" name="self.model.model.layers.4.self_attn.o_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 3072" offset="962654548" size="18874368" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.4.self_attn.o_proj.weight"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="778" name="self.model.model.layers.4.self_attn.o_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="779" name="__module.model.model.layers.4.self_attn.o_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1131,1133,input.25"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="780" name="__module.model.model.layers.4/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1137,1139,1150,hidden_states.109,hidden_states.111"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="781" name="Constant_90083_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="981528916" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="782" name="Constant_90083" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="783" name="Constant_90082_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="784" name="Constant_90082" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="785" name="Constant_90080_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="786" name="Constant_90080" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="787" name="__module.model.model.layers.4.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1140"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="788" name="Constant_5314" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="1141"> <dim>1</dim> </port> </output> </layer> <layer id="789" name="__module.model.model.layers.4.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1142,variance.19"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="790" name="Constant_90081_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="791" name="Constant_90081" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="792" name="__module.model.model.layers.4.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1143"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="793" name="__module.model.model.layers.4.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="794" name="__module.model.model.layers.4.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1144"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="795" name="__module.model.model.layers.4.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1145,1146,hidden_states.113,hidden_states.115"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="796" name="__module.model.model.layers.4.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1147,1149"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="797" name="self.model.model.layers.4.mlp.gate_up_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="16384, 3072" offset="981535060" size="100663296" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.4.mlp.gate_up_proj.weight"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="798" name="self.model.model.layers.4.mlp.gate_up_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="799" name="__module.model.model.layers.4.mlp.gate_up_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1154,up_states.17"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> </output> </layer> <layer id="800" name="__module.model.model.layers.4.mlp/prim::ListUnpack/VariadicSplit" type="VariadicSplit" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> <port id="1" precision="I64" /> <port id="2" precision="I32"> <dim>2</dim> </port> </input> <output> <port id="3" precision="FP32" names="1156,input.27"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="4" precision="FP32" names="1157,up_states.19"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="801" name="__module.model.model.layers.4.mlp.activation_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32" names="1158"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="802" name="__module.model.model.layers.4.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="1159"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="803" name="self.model.model.layers.4.mlp.down_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 8192" offset="1082198356" size="50331648" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.4.mlp.down_proj.weight"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="804" name="self.model.model.layers.4.mlp.down_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="805" name="__module.model.model.layers.4.mlp.down_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="1161,input.29"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="806" name="__module.model.model.layers.4/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1163,1165,1173,1184,hidden_states.119,hidden_states.121"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="807" name="Constant_90087_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="1132530004" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="808" name="Constant_90087" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="809" name="Constant_90086_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="810" name="Constant_90086" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="811" name="Constant_90084_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="812" name="Constant_90084" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="813" name="__module.model.model.layers.5.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1174"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="814" name="Constant_5383" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="1175"> <dim>1</dim> </port> </output> </layer> <layer id="815" name="__module.model.model.layers.5.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1176,variance.21"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="816" name="Constant_90085_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="817" name="Constant_90085" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="818" name="__module.model.model.layers.5.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1177"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="819" name="__module.model.model.layers.5.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="820" name="__module.model.model.layers.5.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1178"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="821" name="__module.model.model.layers.5.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1179,1180,hidden_states.123,hidden_states.125"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="822" name="__module.model.model.layers.5.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1181,1183,hidden_states.127"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="823" name="self.model.model.layers.5.self_attn.qkv_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="9216, 3072" offset="1132536148" size="56623104" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.5.self_attn.qkv_proj.weight"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="824" name="self.model.model.layers.5.self_attn.qkv_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="825" name="__module.model.model.layers.5.self_attn.qkv_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1190,qkv.11"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> </output> </layer> <layer id="826" name="Constant_5426" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="827" name="Constant_5428" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="828" name="Constant_5430" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="829" name="__module.model.model.layers.5.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1191,query_states.11"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="830" name="Constant_96608" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="831" name="__module.model.model.layers.5.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1195"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="832" name="__module.model.model.layers.5.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="833" name="__module.model.model.layers.5.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1196,q.11"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="834" name="__module.model.model.layers.5.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="1245"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="835" name="Constant_5993" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="836" name="Constant_5995" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="837" name="Constant_5997" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="838" name="__module.model.model.layers.5.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1255,x2.21"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="839" name="Constant_90088_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="840" name="Constant_90088" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="841" name="__module.model.model.layers.5.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1256"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="842" name="Constant_5890" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="843" name="Constant_5934" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="844" name="Constant_5936" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="845" name="__module.model.model.layers.5.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1250"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="846" name="__module.model.model.layers.5.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="1258"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="847" name="__module.model.model.layers.5.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="1259"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="848" name="__module.model.model.layers.5.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="1260"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="849" name="Constant_102338_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="850" name="Constant_102338" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="851" name="Constant_102331" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="852" name="Constant_102333" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="853" name="Constant_102335" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="854" name="Concat_102336" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="855" name="Broadcast_102339" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="856" name="ReadValue_101155" type="ReadValue" version="opset6"> <data variable_id="past_key_values.5.keypresent.5.key" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.5.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="857" name="Constant_99881" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="858" name="Gather_99882" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="859" name="Constant_5436" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="860" name="Constant_5438" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="861" name="Constant_5440" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="862" name="__module.model.model.layers.5.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1192,key_states.25"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="863" name="Constant_96609" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="864" name="__module.model.model.layers.5.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1198"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="865" name="__module.model.model.layers.5.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="866" name="__module.model.model.layers.5.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1199,key_states.27"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="867" name="__module.model.model.layers.5.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="1261"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="868" name="Constant_6136" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="869" name="Constant_6138" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="870" name="Constant_6140" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="871" name="__module.model.model.layers.5.self_attn/aten::slice/Slice_4" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1271,x2.23"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="872" name="Constant_90089_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="873" name="Constant_90089" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="874" name="__module.model.model.layers.5.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1272"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="875" name="Constant_6033" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="876" name="Constant_6077" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="877" name="Constant_6079" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="878" name="__module.model.model.layers.5.self_attn/aten::slice/Slice_5" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1266"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="879" name="__module.model.model.layers.5.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="1274"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="880" name="__module.model.model.layers.5.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="1275"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="881" name="__module.model.model.layers.5.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="1276"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="882" name="__module.model.model.layers.5.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.129,present.5.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="883" name="Constant_102326_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="884" name="Constant_102326" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="885" name="Constant_102319" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="886" name="Constant_102321" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="887" name="Constant_102323" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="888" name="Concat_102324" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="889" name="Broadcast_102327" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="890" name="ReadValue_101157" type="ReadValue" version="opset6"> <data variable_id="past_key_values.5.valuepresent.5.value" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.5.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="891" name="Constant_99884" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="892" name="Gather_99885" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="893" name="Constant_5446" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="894" name="Constant_5448" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="895" name="Constant_5450" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="896" name="__module.model.model.layers.5.self_attn/aten::slice/Slice_6" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1193,value_states.11"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="897" name="Constant_96610" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="898" name="__module.model.model.layers.5.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1201"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="899" name="__module.model.model.layers.5.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="900" name="__module.model.model.layers.5.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1202"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="901" name="__module.model.model.layers.5.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.131,present.5.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="902" name="__module.model.model.layers.5.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="1286,attn_output.21"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="903" name="__module.model.model.layers.5.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="904" name="__module.model.model.layers.5.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1287"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="905" name="Constant_96611" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="56635704" size="24" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="906" name="__module.model.model.layers.5.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="1290"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="907" name="self.model.model.layers.5.self_attn.o_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 3072" offset="1189159252" size="18874368" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.5.self_attn.o_proj.weight"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="908" name="self.model.model.layers.5.self_attn.o_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="909" name="__module.model.model.layers.5.self_attn.o_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1292,1294,input.31"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="910" name="__module.model.model.layers.5/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1298,1300,1311,hidden_states.133,hidden_states.135"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="911" name="Constant_90093_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="1208033620" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="912" name="Constant_90093" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="913" name="Constant_90092_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="914" name="Constant_90092" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="915" name="Constant_90090_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="916" name="Constant_90090" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="917" name="__module.model.model.layers.5.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1301"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="918" name="Constant_6308" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="1302"> <dim>1</dim> </port> </output> </layer> <layer id="919" name="__module.model.model.layers.5.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1303,variance.23"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="920" name="Constant_90091_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="921" name="Constant_90091" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="922" name="__module.model.model.layers.5.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1304"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="923" name="__module.model.model.layers.5.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="924" name="__module.model.model.layers.5.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1305"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="925" name="__module.model.model.layers.5.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1306,1307,hidden_states.137,hidden_states.139"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="926" name="__module.model.model.layers.5.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1308,1310"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="927" name="self.model.model.layers.5.mlp.gate_up_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="16384, 3072" offset="1208039764" size="100663296" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.5.mlp.gate_up_proj.weight"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="928" name="self.model.model.layers.5.mlp.gate_up_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="929" name="__module.model.model.layers.5.mlp.gate_up_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1315,up_states.21"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> </output> </layer> <layer id="930" name="__module.model.model.layers.5.mlp/prim::ListUnpack/VariadicSplit" type="VariadicSplit" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> <port id="1" precision="I64" /> <port id="2" precision="I32"> <dim>2</dim> </port> </input> <output> <port id="3" precision="FP32" names="1317,input.33"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="4" precision="FP32" names="1318,up_states.23"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="931" name="__module.model.model.layers.5.mlp.activation_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32" names="1319"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="932" name="__module.model.model.layers.5.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="1320"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="933" name="self.model.model.layers.5.mlp.down_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 8192" offset="1308703060" size="50331648" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.5.mlp.down_proj.weight"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="934" name="self.model.model.layers.5.mlp.down_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="935" name="__module.model.model.layers.5.mlp.down_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="1322,input.35"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="936" name="__module.model.model.layers.5/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1324,1326,1334,1345,hidden_states.143,hidden_states.145"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="937" name="Constant_90097_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="1359034708" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="938" name="Constant_90097" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="939" name="Constant_90096_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="940" name="Constant_90096" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="941" name="Constant_90094_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="942" name="Constant_90094" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="943" name="__module.model.model.layers.6.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1335"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="944" name="Constant_6377" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="1336"> <dim>1</dim> </port> </output> </layer> <layer id="945" name="__module.model.model.layers.6.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1337,variance.25"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="946" name="Constant_90095_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="947" name="Constant_90095" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="948" name="__module.model.model.layers.6.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1338"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="949" name="__module.model.model.layers.6.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="950" name="__module.model.model.layers.6.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1339"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="951" name="__module.model.model.layers.6.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1340,1341,hidden_states.147,hidden_states.149"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="952" name="__module.model.model.layers.6.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1342,1344,hidden_states.151"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="953" name="self.model.model.layers.6.self_attn.qkv_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="9216, 3072" offset="1359040852" size="56623104" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.6.self_attn.qkv_proj.weight"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="954" name="self.model.model.layers.6.self_attn.qkv_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="955" name="__module.model.model.layers.6.self_attn.qkv_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1351,qkv.13"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> </output> </layer> <layer id="956" name="Constant_6420" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="957" name="Constant_6422" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="958" name="Constant_6424" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="959" name="__module.model.model.layers.6.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1352,query_states.13"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="960" name="Constant_96612" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="961" name="__module.model.model.layers.6.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1356"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="962" name="__module.model.model.layers.6.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="963" name="__module.model.model.layers.6.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1357,q.13"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="964" name="__module.model.model.layers.6.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="1406"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="965" name="Constant_6987" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="966" name="Constant_6989" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="967" name="Constant_6991" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="968" name="__module.model.model.layers.6.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1416,x2.25"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="969" name="Constant_90098_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="970" name="Constant_90098" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="971" name="__module.model.model.layers.6.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1417"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="972" name="Constant_6884" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="973" name="Constant_6928" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="974" name="Constant_6930" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="975" name="__module.model.model.layers.6.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1411"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="976" name="__module.model.model.layers.6.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="1419"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="977" name="__module.model.model.layers.6.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="1420"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="978" name="__module.model.model.layers.6.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="1421"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="979" name="Constant_102362_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="980" name="Constant_102362" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="981" name="Constant_102355" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="982" name="Constant_102357" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="983" name="Constant_102359" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="984" name="Concat_102360" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="985" name="Broadcast_102363" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="986" name="ReadValue_101159" type="ReadValue" version="opset6"> <data variable_id="past_key_values.6.keypresent.6.key" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.6.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="987" name="Constant_99887" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="988" name="Gather_99888" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="989" name="Constant_6430" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="990" name="Constant_6432" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="991" name="Constant_6434" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="992" name="__module.model.model.layers.6.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1353,key_states.29"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="993" name="Constant_96613" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="994" name="__module.model.model.layers.6.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1359"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="995" name="__module.model.model.layers.6.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="996" name="__module.model.model.layers.6.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1360,key_states.31"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="997" name="__module.model.model.layers.6.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="1422"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="998" name="Constant_7130" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="999" name="Constant_7132" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1000" name="Constant_7134" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1001" name="__module.model.model.layers.6.self_attn/aten::slice/Slice_4" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1432,x2.27"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="1002" name="Constant_90099_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1003" name="Constant_90099" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1004" name="__module.model.model.layers.6.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1433"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="1005" name="Constant_7027" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1006" name="Constant_7071" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1007" name="Constant_7073" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1008" name="__module.model.model.layers.6.self_attn/aten::slice/Slice_5" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1427"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="1009" name="__module.model.model.layers.6.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="1435"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1010" name="__module.model.model.layers.6.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="1436"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1011" name="__module.model.model.layers.6.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="1437"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1012" name="__module.model.model.layers.6.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.153,present.6.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1013" name="Constant_102350_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="1014" name="Constant_102350" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="1015" name="Constant_102343" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1016" name="Constant_102345" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1017" name="Constant_102347" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1018" name="Concat_102348" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1019" name="Broadcast_102351" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="1020" name="ReadValue_101161" type="ReadValue" version="opset6"> <data variable_id="past_key_values.6.valuepresent.6.value" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.6.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1021" name="Constant_99890" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="1022" name="Gather_99891" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1023" name="Constant_6440" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1024" name="Constant_6442" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1025" name="Constant_6444" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1026" name="__module.model.model.layers.6.self_attn/aten::slice/Slice_6" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1354,value_states.13"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1027" name="Constant_96614" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1028" name="__module.model.model.layers.6.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1362"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="1029" name="__module.model.model.layers.6.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1030" name="__module.model.model.layers.6.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1363"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1031" name="__module.model.model.layers.6.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.155,present.6.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1032" name="__module.model.model.layers.6.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="1447,attn_output.25"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1033" name="__module.model.model.layers.6.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1034" name="__module.model.model.layers.6.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1448"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="1035" name="Constant_96615" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="56635704" size="24" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="1036" name="__module.model.model.layers.6.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="1451"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1037" name="self.model.model.layers.6.self_attn.o_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 3072" offset="1415663956" size="18874368" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.6.self_attn.o_proj.weight"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1038" name="self.model.model.layers.6.self_attn.o_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1039" name="__module.model.model.layers.6.self_attn.o_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1453,1455,input.37"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1040" name="__module.model.model.layers.6/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1459,1461,1472,hidden_states.157,hidden_states.159"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1041" name="Constant_90103_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="1434538324" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1042" name="Constant_90103" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1043" name="Constant_90102_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1044" name="Constant_90102" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1045" name="Constant_90100_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1046" name="Constant_90100" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1047" name="__module.model.model.layers.6.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1462"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1048" name="Constant_7302" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="1463"> <dim>1</dim> </port> </output> </layer> <layer id="1049" name="__module.model.model.layers.6.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1464,variance.27"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1050" name="Constant_90101_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1051" name="Constant_90101" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1052" name="__module.model.model.layers.6.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1465"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1053" name="__module.model.model.layers.6.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1054" name="__module.model.model.layers.6.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1466"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1055" name="__module.model.model.layers.6.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1467,1468,hidden_states.161,hidden_states.163"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1056" name="__module.model.model.layers.6.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1469,1471"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1057" name="self.model.model.layers.6.mlp.gate_up_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="16384, 3072" offset="1434544468" size="100663296" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.6.mlp.gate_up_proj.weight"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1058" name="self.model.model.layers.6.mlp.gate_up_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1059" name="__module.model.model.layers.6.mlp.gate_up_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1476,up_states.25"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> </output> </layer> <layer id="1060" name="__module.model.model.layers.6.mlp/prim::ListUnpack/VariadicSplit" type="VariadicSplit" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> <port id="1" precision="I64" /> <port id="2" precision="I32"> <dim>2</dim> </port> </input> <output> <port id="3" precision="FP32" names="1478,input.39"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="4" precision="FP32" names="1479,up_states.27"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="1061" name="__module.model.model.layers.6.mlp.activation_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32" names="1480"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="1062" name="__module.model.model.layers.6.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="1481"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="1063" name="self.model.model.layers.6.mlp.down_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 8192" offset="1535207764" size="50331648" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.6.mlp.down_proj.weight"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="1064" name="self.model.model.layers.6.mlp.down_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="1065" name="__module.model.model.layers.6.mlp.down_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="1483,input.41"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1066" name="__module.model.model.layers.6/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1485,1487,1495,1506,hidden_states.167,hidden_states.169"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1067" name="Constant_90107_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="1585539412" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1068" name="Constant_90107" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1069" name="Constant_90106_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1070" name="Constant_90106" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1071" name="Constant_90104_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1072" name="Constant_90104" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1073" name="__module.model.model.layers.7.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1496"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1074" name="Constant_7371" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="1497"> <dim>1</dim> </port> </output> </layer> <layer id="1075" name="__module.model.model.layers.7.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1498,variance.29"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1076" name="Constant_90105_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1077" name="Constant_90105" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1078" name="__module.model.model.layers.7.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1499"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1079" name="__module.model.model.layers.7.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1080" name="__module.model.model.layers.7.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1500"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1081" name="__module.model.model.layers.7.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1501,1502,hidden_states.171,hidden_states.173"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1082" name="__module.model.model.layers.7.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1503,1505,hidden_states.175"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1083" name="self.model.model.layers.7.self_attn.qkv_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="9216, 3072" offset="1585545556" size="56623104" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.7.self_attn.qkv_proj.weight"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1084" name="self.model.model.layers.7.self_attn.qkv_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1085" name="__module.model.model.layers.7.self_attn.qkv_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1512,qkv.15"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> </output> </layer> <layer id="1086" name="Constant_7414" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1087" name="Constant_7416" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1088" name="Constant_7418" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1089" name="__module.model.model.layers.7.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1513,query_states.15"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1090" name="Constant_96616" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1091" name="__module.model.model.layers.7.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1517"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="1092" name="__module.model.model.layers.7.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1093" name="__module.model.model.layers.7.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1518,q.15"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1094" name="__module.model.model.layers.7.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="1567"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1095" name="Constant_7981" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1096" name="Constant_7983" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1097" name="Constant_7985" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1098" name="__module.model.model.layers.7.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1577,x2.29"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="1099" name="Constant_90108_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1100" name="Constant_90108" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1101" name="__module.model.model.layers.7.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1578"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="1102" name="Constant_7878" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1103" name="Constant_7922" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1104" name="Constant_7924" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1105" name="__module.model.model.layers.7.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1572"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="1106" name="__module.model.model.layers.7.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="1580"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1107" name="__module.model.model.layers.7.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="1581"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1108" name="__module.model.model.layers.7.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="1582"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1109" name="Constant_102386_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="1110" name="Constant_102386" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="1111" name="Constant_102379" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1112" name="Constant_102381" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1113" name="Constant_102383" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1114" name="Concat_102384" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1115" name="Broadcast_102387" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="1116" name="ReadValue_101163" type="ReadValue" version="opset6"> <data variable_id="past_key_values.7.keypresent.7.key" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.7.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1117" name="Constant_99893" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="1118" name="Gather_99894" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1119" name="Constant_7424" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1120" name="Constant_7426" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1121" name="Constant_7428" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1122" name="__module.model.model.layers.7.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1514,key_states.33"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1123" name="Constant_96617" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1124" name="__module.model.model.layers.7.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1520"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="1125" name="__module.model.model.layers.7.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1126" name="__module.model.model.layers.7.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1521,key_states.35"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1127" name="__module.model.model.layers.7.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="1583"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1128" name="Constant_8124" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1129" name="Constant_8126" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1130" name="Constant_8128" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1131" name="__module.model.model.layers.7.self_attn/aten::slice/Slice_4" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1593,x2.31"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="1132" name="Constant_90109_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1133" name="Constant_90109" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1134" name="__module.model.model.layers.7.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1594"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="1135" name="Constant_8021" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1136" name="Constant_8065" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1137" name="Constant_8067" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1138" name="__module.model.model.layers.7.self_attn/aten::slice/Slice_5" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1588"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="1139" name="__module.model.model.layers.7.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="1596"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1140" name="__module.model.model.layers.7.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="1597"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1141" name="__module.model.model.layers.7.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="1598"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1142" name="__module.model.model.layers.7.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.177,present.7.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1143" name="Constant_102374_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="1144" name="Constant_102374" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="1145" name="Constant_102367" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1146" name="Constant_102369" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1147" name="Constant_102371" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1148" name="Concat_102372" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1149" name="Broadcast_102375" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="1150" name="ReadValue_101165" type="ReadValue" version="opset6"> <data variable_id="past_key_values.7.valuepresent.7.value" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.7.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1151" name="Constant_99896" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="1152" name="Gather_99897" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1153" name="Constant_7434" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1154" name="Constant_7436" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1155" name="Constant_7438" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1156" name="__module.model.model.layers.7.self_attn/aten::slice/Slice_6" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1515,value_states.15"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1157" name="Constant_96618" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1158" name="__module.model.model.layers.7.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1523"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="1159" name="__module.model.model.layers.7.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1160" name="__module.model.model.layers.7.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1524"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1161" name="__module.model.model.layers.7.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.179,present.7.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1162" name="__module.model.model.layers.7.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="1608,attn_output.29"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1163" name="__module.model.model.layers.7.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1164" name="__module.model.model.layers.7.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1609"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="1165" name="Constant_96619" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="56635704" size="24" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="1166" name="__module.model.model.layers.7.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="1612"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1167" name="self.model.model.layers.7.self_attn.o_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 3072" offset="1642168660" size="18874368" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.7.self_attn.o_proj.weight"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1168" name="self.model.model.layers.7.self_attn.o_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1169" name="__module.model.model.layers.7.self_attn.o_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1614,1616,input.43"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1170" name="__module.model.model.layers.7/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1620,1622,1633,hidden_states.181,hidden_states.183"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1171" name="Constant_90113_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="1661043028" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1172" name="Constant_90113" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1173" name="Constant_90112_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1174" name="Constant_90112" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1175" name="Constant_90110_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1176" name="Constant_90110" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1177" name="__module.model.model.layers.7.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1623"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1178" name="Constant_8296" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="1624"> <dim>1</dim> </port> </output> </layer> <layer id="1179" name="__module.model.model.layers.7.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1625,variance.31"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1180" name="Constant_90111_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1181" name="Constant_90111" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1182" name="__module.model.model.layers.7.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1626"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1183" name="__module.model.model.layers.7.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1184" name="__module.model.model.layers.7.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1627"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1185" name="__module.model.model.layers.7.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1628,1629,hidden_states.185,hidden_states.187"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1186" name="__module.model.model.layers.7.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1630,1632"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1187" name="self.model.model.layers.7.mlp.gate_up_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="16384, 3072" offset="1661049172" size="100663296" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.7.mlp.gate_up_proj.weight"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1188" name="self.model.model.layers.7.mlp.gate_up_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1189" name="__module.model.model.layers.7.mlp.gate_up_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1637,up_states.29"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> </output> </layer> <layer id="1190" name="__module.model.model.layers.7.mlp/prim::ListUnpack/VariadicSplit" type="VariadicSplit" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> <port id="1" precision="I64" /> <port id="2" precision="I32"> <dim>2</dim> </port> </input> <output> <port id="3" precision="FP32" names="1639,input.45"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="4" precision="FP32" names="1640,up_states.31"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="1191" name="__module.model.model.layers.7.mlp.activation_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32" names="1641"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="1192" name="__module.model.model.layers.7.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="1642"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="1193" name="self.model.model.layers.7.mlp.down_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 8192" offset="1761712468" size="50331648" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.7.mlp.down_proj.weight"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="1194" name="self.model.model.layers.7.mlp.down_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="1195" name="__module.model.model.layers.7.mlp.down_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="1644,input.47"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1196" name="__module.model.model.layers.7/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1646,1648,1656,1667,hidden_states.191,hidden_states.193"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1197" name="Constant_90117_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="1812044116" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1198" name="Constant_90117" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1199" name="Constant_90116_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1200" name="Constant_90116" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1201" name="Constant_90114_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1202" name="Constant_90114" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1203" name="__module.model.model.layers.8.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1657"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1204" name="Constant_8365" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="1658"> <dim>1</dim> </port> </output> </layer> <layer id="1205" name="__module.model.model.layers.8.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1659,variance.33"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1206" name="Constant_90115_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1207" name="Constant_90115" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1208" name="__module.model.model.layers.8.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1660"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1209" name="__module.model.model.layers.8.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1210" name="__module.model.model.layers.8.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1661"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1211" name="__module.model.model.layers.8.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1662,1663,hidden_states.195,hidden_states.197"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1212" name="__module.model.model.layers.8.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1664,1666,hidden_states.199"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1213" name="self.model.model.layers.8.self_attn.qkv_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="9216, 3072" offset="1812050260" size="56623104" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.8.self_attn.qkv_proj.weight"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1214" name="self.model.model.layers.8.self_attn.qkv_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1215" name="__module.model.model.layers.8.self_attn.qkv_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1673,qkv.17"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> </output> </layer> <layer id="1216" name="Constant_8408" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1217" name="Constant_8410" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1218" name="Constant_8412" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1219" name="__module.model.model.layers.8.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1674,query_states.17"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1220" name="Constant_96620" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1221" name="__module.model.model.layers.8.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1678"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="1222" name="__module.model.model.layers.8.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1223" name="__module.model.model.layers.8.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1679,q.17"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1224" name="__module.model.model.layers.8.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="1728"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1225" name="Constant_8975" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1226" name="Constant_8977" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1227" name="Constant_8979" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1228" name="__module.model.model.layers.8.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1738,x2.33"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="1229" name="Constant_90118_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1230" name="Constant_90118" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1231" name="__module.model.model.layers.8.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1739"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="1232" name="Constant_8872" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1233" name="Constant_8916" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1234" name="Constant_8918" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1235" name="__module.model.model.layers.8.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1733"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="1236" name="__module.model.model.layers.8.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="1741"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1237" name="__module.model.model.layers.8.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="1742"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1238" name="__module.model.model.layers.8.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="1743"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1239" name="Constant_102410_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="1240" name="Constant_102410" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="1241" name="Constant_102403" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1242" name="Constant_102405" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1243" name="Constant_102407" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1244" name="Concat_102408" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1245" name="Broadcast_102411" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="1246" name="ReadValue_101167" type="ReadValue" version="opset6"> <data variable_id="past_key_values.8.keypresent.8.key" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.8.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1247" name="Constant_99899" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="1248" name="Gather_99900" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1249" name="Constant_8418" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1250" name="Constant_8420" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1251" name="Constant_8422" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1252" name="__module.model.model.layers.8.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1675,key_states.37"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1253" name="Constant_96621" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1254" name="__module.model.model.layers.8.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1681"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="1255" name="__module.model.model.layers.8.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1256" name="__module.model.model.layers.8.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1682,key_states.39"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1257" name="__module.model.model.layers.8.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="1744"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1258" name="Constant_9118" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1259" name="Constant_9120" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1260" name="Constant_9122" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1261" name="__module.model.model.layers.8.self_attn/aten::slice/Slice_4" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1754,x2.35"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="1262" name="Constant_90119_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1263" name="Constant_90119" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1264" name="__module.model.model.layers.8.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1755"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="1265" name="Constant_9015" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1266" name="Constant_9059" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1267" name="Constant_9061" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1268" name="__module.model.model.layers.8.self_attn/aten::slice/Slice_5" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1749"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="1269" name="__module.model.model.layers.8.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="1757"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1270" name="__module.model.model.layers.8.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="1758"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1271" name="__module.model.model.layers.8.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="1759"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1272" name="__module.model.model.layers.8.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.201,present.8.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1273" name="Constant_102398_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="1274" name="Constant_102398" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="1275" name="Constant_102391" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1276" name="Constant_102393" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1277" name="Constant_102395" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1278" name="Concat_102396" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1279" name="Broadcast_102399" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="1280" name="ReadValue_101169" type="ReadValue" version="opset6"> <data variable_id="past_key_values.8.valuepresent.8.value" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.8.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1281" name="Constant_99902" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="1282" name="Gather_99903" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1283" name="Constant_8428" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1284" name="Constant_8430" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1285" name="Constant_8432" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1286" name="__module.model.model.layers.8.self_attn/aten::slice/Slice_6" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1676,value_states.17"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1287" name="Constant_96622" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1288" name="__module.model.model.layers.8.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1684"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="1289" name="__module.model.model.layers.8.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1290" name="__module.model.model.layers.8.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1685"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1291" name="__module.model.model.layers.8.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.203,present.8.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1292" name="__module.model.model.layers.8.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="1769,attn_output.33"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1293" name="__module.model.model.layers.8.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1294" name="__module.model.model.layers.8.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1770"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="1295" name="Constant_96623" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="56635704" size="24" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="1296" name="__module.model.model.layers.8.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="1773"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1297" name="self.model.model.layers.8.self_attn.o_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 3072" offset="1868673364" size="18874368" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.8.self_attn.o_proj.weight"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1298" name="self.model.model.layers.8.self_attn.o_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1299" name="__module.model.model.layers.8.self_attn.o_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1775,1777,input.49"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1300" name="__module.model.model.layers.8/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1781,1783,1794,hidden_states.205,hidden_states.207"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1301" name="Constant_90123_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="1887547732" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1302" name="Constant_90123" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1303" name="Constant_90122_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1304" name="Constant_90122" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1305" name="Constant_90120_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1306" name="Constant_90120" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1307" name="__module.model.model.layers.8.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1784"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1308" name="Constant_9290" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="1785"> <dim>1</dim> </port> </output> </layer> <layer id="1309" name="__module.model.model.layers.8.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1786,variance.35"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1310" name="Constant_90121_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1311" name="Constant_90121" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1312" name="__module.model.model.layers.8.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1787"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1313" name="__module.model.model.layers.8.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1314" name="__module.model.model.layers.8.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1788"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1315" name="__module.model.model.layers.8.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1789,1790,hidden_states.209,hidden_states.211"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1316" name="__module.model.model.layers.8.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1791,1793"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1317" name="self.model.model.layers.8.mlp.gate_up_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="16384, 3072" offset="1887553876" size="100663296" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.8.mlp.gate_up_proj.weight"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1318" name="self.model.model.layers.8.mlp.gate_up_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1319" name="__module.model.model.layers.8.mlp.gate_up_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1798,up_states.33"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> </output> </layer> <layer id="1320" name="__module.model.model.layers.8.mlp/prim::ListUnpack/VariadicSplit" type="VariadicSplit" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> <port id="1" precision="I64" /> <port id="2" precision="I32"> <dim>2</dim> </port> </input> <output> <port id="3" precision="FP32" names="1800,input.51"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="4" precision="FP32" names="1801,up_states.35"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="1321" name="__module.model.model.layers.8.mlp.activation_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32" names="1802"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="1322" name="__module.model.model.layers.8.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="1803"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="1323" name="self.model.model.layers.8.mlp.down_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 8192" offset="1988217172" size="50331648" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.8.mlp.down_proj.weight"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="1324" name="self.model.model.layers.8.mlp.down_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="1325" name="__module.model.model.layers.8.mlp.down_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="1805,input.53"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1326" name="__module.model.model.layers.8/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1807,1809,1817,1828,hidden_states.215,hidden_states.217"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1327" name="Constant_90126_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1328" name="Constant_90126" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1329" name="Constant_90124_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1330" name="Constant_90124" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1331" name="__module.model.model.layers.9.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1818"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1332" name="Constant_9359" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="1819"> <dim>1</dim> </port> </output> </layer> <layer id="1333" name="__module.model.model.layers.9.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1820,variance.37"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1334" name="Constant_90125_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1335" name="Constant_90125" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1336" name="__module.model.model.layers.9.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1821"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1337" name="__module.model.model.layers.9.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1338" name="__module.model.model.layers.9.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1822"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1339" name="__module.model.model.layers.9.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1823,1824,hidden_states.219,hidden_states.221"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1340" name="__module.model.model.layers.9.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1825,1827,hidden_states.223"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1341" name="self.model.model.layers.9.self_attn.qkv_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="9216, 3072" offset="2038548820" size="56623104" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.9.self_attn.qkv_proj.weight"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1342" name="self.model.model.layers.9.self_attn.qkv_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1343" name="__module.model.model.layers.9.self_attn.qkv_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1834,qkv.19"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> </output> </layer> <layer id="1344" name="Constant_9422" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1345" name="Constant_9424" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1346" name="Constant_9426" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1347" name="__module.model.model.layers.9.self_attn/aten::slice/Slice_6" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1837,value_states.19"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1348" name="Constant_96626" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1349" name="__module.model.model.layers.9.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1845"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="1350" name="__module.model.model.layers.9.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1351" name="__module.model.model.layers.9.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1846"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1352" name="__module.model.model.layers.9.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.227,present.9.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1354" name="Constant_102422_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="1355" name="Constant_102422" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="1356" name="Constant_102415" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1357" name="Constant_102417" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1358" name="Constant_102419" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1359" name="Concat_102420" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1360" name="Broadcast_102423" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="1361" name="ReadValue_101171" type="ReadValue" version="opset6"> <data variable_id="past_key_values.9.keypresent.9.key" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.9.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1362" name="Constant_99905" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="1363" name="Gather_99906" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1364" name="Constant_9412" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1365" name="Constant_9414" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1366" name="Constant_9416" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1367" name="__module.model.model.layers.9.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1836,key_states.41"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1368" name="Constant_96625" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1369" name="__module.model.model.layers.9.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1842"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="1370" name="__module.model.model.layers.9.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1371" name="__module.model.model.layers.9.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1843,key_states.43"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1372" name="__module.model.model.layers.9.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="1905"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1373" name="Constant_10112" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1374" name="Constant_10114" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1375" name="Constant_10116" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1376" name="__module.model.model.layers.9.self_attn/aten::slice/Slice_4" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1915,x2.39"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="1377" name="Constant_90129_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1378" name="Constant_90129" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1379" name="__module.model.model.layers.9.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1916"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="1380" name="Constant_10009" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1381" name="Constant_10053" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1382" name="Constant_10055" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1383" name="__module.model.model.layers.9.self_attn/aten::slice/Slice_5" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1910"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="1384" name="__module.model.model.layers.9.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="1918"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1385" name="__module.model.model.layers.9.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="1919"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1386" name="__module.model.model.layers.9.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="1920"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1387" name="__module.model.model.layers.9.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.225,present.9.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1399" name="Constant_102434_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="1400" name="Constant_102434" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="1401" name="Constant_102427" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1402" name="Constant_102429" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1403" name="Constant_102431" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1404" name="Concat_102432" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1405" name="Broadcast_102435" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="1406" name="ReadValue_101149" type="ReadValue" version="opset6"> <data variable_id="past_key_values.31.valuepresent.31.value" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.31.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1407" name="Constant_100040" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="1408" name="Gather_100041" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1409" name="Constant_90347_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="2095171924" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1410" name="Constant_90347" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1411" name="Constant_9402" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1412" name="Constant_9404" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1413" name="Constant_9406" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1414" name="__module.model.model.layers.9.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1835,query_states.19"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1415" name="Constant_96624" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1416" name="__module.model.model.layers.9.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1839"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="1417" name="__module.model.model.layers.9.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1418" name="__module.model.model.layers.9.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1840,q.19"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1419" name="__module.model.model.layers.9.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="1889"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1420" name="Constant_9969" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1421" name="Constant_9971" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1422" name="Constant_9973" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1423" name="__module.model.model.layers.9.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1899,x2.37"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="1424" name="Constant_90128_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1425" name="Constant_90128" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1426" name="__module.model.model.layers.9.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1900"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="1427" name="Constant_9866" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1428" name="Constant_9910" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1429" name="Constant_9912" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1430" name="__module.model.model.layers.9.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1894"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="1431" name="__module.model.model.layers.9.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="1902"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1432" name="__module.model.model.layers.9.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="1903"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1433" name="__module.model.model.layers.9.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="1904"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1434" name="__module.model.model.layers.9.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="1930,attn_output.37"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1435" name="__module.model.model.layers.9.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1436" name="__module.model.model.layers.9.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="1931"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="1437" name="Constant_96627" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="56635704" size="24" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="1438" name="__module.model.model.layers.9.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="1934"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1439" name="self.model.model.layers.9.self_attn.o_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 3072" offset="2095178068" size="18874368" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.9.self_attn.o_proj.weight"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1440" name="self.model.model.layers.9.self_attn.o_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1441" name="__module.model.model.layers.9.self_attn.o_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1936,1938,input.55"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1442" name="__module.model.model.layers.9/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1942,1944,1955,hidden_states.229,hidden_states.231"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1443" name="Constant_90133_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="2114052436" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1444" name="Constant_90133" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1445" name="Constant_90132_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1446" name="Constant_90132" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1447" name="Constant_90130_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1448" name="Constant_90130" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1449" name="__module.model.model.layers.9.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1945"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1450" name="Constant_10284" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="1946"> <dim>1</dim> </port> </output> </layer> <layer id="1451" name="__module.model.model.layers.9.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1947,variance.39"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1452" name="Constant_90131_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1453" name="Constant_90131" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1454" name="__module.model.model.layers.9.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1948"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1455" name="__module.model.model.layers.9.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1456" name="__module.model.model.layers.9.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1949"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1457" name="__module.model.model.layers.9.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1950,1951,hidden_states.233,hidden_states.235"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1458" name="__module.model.model.layers.9.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1952,1954"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1459" name="self.model.model.layers.9.mlp.gate_up_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="16384, 3072" offset="2114058580" size="100663296" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.9.mlp.gate_up_proj.weight"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1460" name="self.model.model.layers.9.mlp.gate_up_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1461" name="__module.model.model.layers.9.mlp.gate_up_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1959,up_states.37"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> </output> </layer> <layer id="1462" name="__module.model.model.layers.9.mlp/prim::ListUnpack/VariadicSplit" type="VariadicSplit" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> <port id="1" precision="I64" /> <port id="2" precision="I32"> <dim>2</dim> </port> </input> <output> <port id="3" precision="FP32" names="1961,input.57"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="4" precision="FP32" names="1962,up_states.39"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="1463" name="__module.model.model.layers.9.mlp.activation_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32" names="1963"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="1464" name="__module.model.model.layers.9.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="1964"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="1465" name="self.model.model.layers.9.mlp.down_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 8192" offset="2214721876" size="50331648" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.9.mlp.down_proj.weight"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="1466" name="self.model.model.layers.9.mlp.down_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="1467" name="__module.model.model.layers.9.mlp.down_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="1966,input.59"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1468" name="__module.model.model.layers.9/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1968,1970,1978,1989,hidden_states.239,hidden_states.241"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1469" name="Constant_90137_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="2265053524" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1470" name="Constant_90137" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1471" name="Constant_90136_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1472" name="Constant_90136" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1473" name="Constant_90134_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1474" name="Constant_90134" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1475" name="__module.model.model.layers.10.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1979"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1476" name="Constant_10353" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="1980"> <dim>1</dim> </port> </output> </layer> <layer id="1477" name="__module.model.model.layers.10.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1981,variance.41"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1478" name="Constant_90135_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1479" name="Constant_90135" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1480" name="__module.model.model.layers.10.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1982"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1481" name="__module.model.model.layers.10.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1482" name="__module.model.model.layers.10.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1983"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1483" name="__module.model.model.layers.10.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="1984,1985,hidden_states.243,hidden_states.245"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1484" name="__module.model.model.layers.10.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1986,1988,hidden_states.247"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1485" name="self.model.model.layers.10.self_attn.qkv_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="9216, 3072" offset="2265059668" size="56623104" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.10.self_attn.qkv_proj.weight"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1486" name="self.model.model.layers.10.self_attn.qkv_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1487" name="__module.model.model.layers.10.self_attn.qkv_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="1995,qkv.21"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> </output> </layer> <layer id="1488" name="Constant_10396" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1489" name="Constant_10398" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1490" name="Constant_10400" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1491" name="__module.model.model.layers.10.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1996,query_states.21"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1492" name="Constant_96628" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1493" name="__module.model.model.layers.10.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2000"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="1494" name="__module.model.model.layers.10.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1495" name="__module.model.model.layers.10.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2001,q.21"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1496" name="__module.model.model.layers.10.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="2050"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1497" name="Constant_10963" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1498" name="Constant_10965" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1499" name="Constant_10967" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1500" name="__module.model.model.layers.10.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2060,x2.41"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="1501" name="Constant_90138_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1502" name="Constant_90138" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1503" name="__module.model.model.layers.10.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2061"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="1504" name="Constant_10860" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1505" name="Constant_10904" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1506" name="Constant_10906" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1507" name="__module.model.model.layers.10.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2055"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="1508" name="__module.model.model.layers.10.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="2063"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1509" name="__module.model.model.layers.10.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="2064"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1510" name="__module.model.model.layers.10.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="2065"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1511" name="Constant_102458_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="1512" name="Constant_102458" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="1513" name="Constant_102451" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1514" name="Constant_102453" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1515" name="Constant_102455" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1516" name="Concat_102456" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1517" name="Broadcast_102459" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="1518" name="ReadValue_101055" type="ReadValue" version="opset6"> <data variable_id="past_key_values.10.keypresent.10.key" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.10.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1519" name="Constant_99911" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="1520" name="Gather_99912" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1521" name="Constant_10406" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1522" name="Constant_10408" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1523" name="Constant_10410" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1524" name="__module.model.model.layers.10.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1997,key_states.45"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1525" name="Constant_96629" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1526" name="__module.model.model.layers.10.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2003"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="1527" name="__module.model.model.layers.10.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1528" name="__module.model.model.layers.10.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2004,key_states.47"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1529" name="__module.model.model.layers.10.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="2066"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1530" name="Constant_11106" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1531" name="Constant_11108" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1532" name="Constant_11110" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1533" name="__module.model.model.layers.10.self_attn/aten::slice/Slice_4" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2076,x2.43"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="1534" name="Constant_90139_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1535" name="Constant_90139" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1536" name="__module.model.model.layers.10.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2077"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="1537" name="Constant_11003" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1538" name="Constant_11047" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1539" name="Constant_11049" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1540" name="__module.model.model.layers.10.self_attn/aten::slice/Slice_5" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2071"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="1541" name="__module.model.model.layers.10.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="2079"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1542" name="__module.model.model.layers.10.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="2080"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1543" name="__module.model.model.layers.10.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="2081"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1544" name="__module.model.model.layers.10.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.249,present.10.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1545" name="Constant_102446_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="1546" name="Constant_102446" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="1547" name="Constant_102439" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1548" name="Constant_102441" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1549" name="Constant_102443" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1550" name="Concat_102444" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1551" name="Broadcast_102447" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="1552" name="ReadValue_101057" type="ReadValue" version="opset6"> <data variable_id="past_key_values.10.valuepresent.10.value" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.10.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1553" name="Constant_99914" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="1554" name="Gather_99915" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1555" name="Constant_10416" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1556" name="Constant_10418" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1557" name="Constant_10420" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1558" name="__module.model.model.layers.10.self_attn/aten::slice/Slice_6" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="1998,value_states.21"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1559" name="Constant_96630" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1560" name="__module.model.model.layers.10.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2006"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="1561" name="__module.model.model.layers.10.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1562" name="__module.model.model.layers.10.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2007"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1563" name="__module.model.model.layers.10.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.251,present.10.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1564" name="__module.model.model.layers.10.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="2091,attn_output.41"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1565" name="__module.model.model.layers.10.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1566" name="__module.model.model.layers.10.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2092"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="1567" name="Constant_96631" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="56635704" size="24" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="1568" name="__module.model.model.layers.10.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="2095"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1569" name="self.model.model.layers.10.self_attn.o_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 3072" offset="2321682772" size="18874368" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.10.self_attn.o_proj.weight"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1570" name="self.model.model.layers.10.self_attn.o_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1571" name="__module.model.model.layers.10.self_attn.o_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2097,2099,input.61"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1572" name="__module.model.model.layers.10/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2103,2105,2116,hidden_states.253,hidden_states.255"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1573" name="Constant_90143_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="2340557140" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1574" name="Constant_90143" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1575" name="Constant_90142_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1576" name="Constant_90142" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1577" name="Constant_90140_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1578" name="Constant_90140" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1579" name="__module.model.model.layers.10.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2106"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1580" name="Constant_11278" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="2107"> <dim>1</dim> </port> </output> </layer> <layer id="1581" name="__module.model.model.layers.10.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2108,variance.43"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1582" name="Constant_90141_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1583" name="Constant_90141" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1584" name="__module.model.model.layers.10.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2109"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1585" name="__module.model.model.layers.10.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1586" name="__module.model.model.layers.10.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2110"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1587" name="__module.model.model.layers.10.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2111,2112,hidden_states.257,hidden_states.259"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1588" name="__module.model.model.layers.10.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2113,2115"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1589" name="self.model.model.layers.10.mlp.gate_up_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="16384, 3072" offset="2340563284" size="100663296" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.10.mlp.gate_up_proj.weight"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1590" name="self.model.model.layers.10.mlp.gate_up_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1591" name="__module.model.model.layers.10.mlp.gate_up_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2120,up_states.41"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> </output> </layer> <layer id="1592" name="__module.model.model.layers.10.mlp/prim::ListUnpack/VariadicSplit" type="VariadicSplit" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> <port id="1" precision="I64" /> <port id="2" precision="I32"> <dim>2</dim> </port> </input> <output> <port id="3" precision="FP32" names="2122,input.63"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="4" precision="FP32" names="2123,up_states.43"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="1593" name="__module.model.model.layers.10.mlp.activation_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32" names="2124"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="1594" name="__module.model.model.layers.10.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="2125"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="1595" name="self.model.model.layers.10.mlp.down_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 8192" offset="2441226580" size="50331648" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.10.mlp.down_proj.weight"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="1596" name="self.model.model.layers.10.mlp.down_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="1597" name="__module.model.model.layers.10.mlp.down_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="2127,input.65"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1598" name="__module.model.model.layers.10/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2129,2131,2139,2150,hidden_states.263,hidden_states.265"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1599" name="Constant_90147_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="2491558228" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1600" name="Constant_90147" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1601" name="Constant_90146_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1602" name="Constant_90146" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1603" name="Constant_90144_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1604" name="Constant_90144" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1605" name="__module.model.model.layers.11.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2140"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1606" name="Constant_11347" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="2141"> <dim>1</dim> </port> </output> </layer> <layer id="1607" name="__module.model.model.layers.11.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2142,variance.45"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1608" name="Constant_90145_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1609" name="Constant_90145" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1610" name="__module.model.model.layers.11.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2143"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1611" name="__module.model.model.layers.11.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1612" name="__module.model.model.layers.11.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2144"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1613" name="__module.model.model.layers.11.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2145,2146,hidden_states.267,hidden_states.269"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1614" name="__module.model.model.layers.11.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2147,2149,hidden_states.271"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1615" name="self.model.model.layers.11.self_attn.qkv_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="9216, 3072" offset="2491564372" size="56623104" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.11.self_attn.qkv_proj.weight"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1616" name="self.model.model.layers.11.self_attn.qkv_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1617" name="__module.model.model.layers.11.self_attn.qkv_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2156,qkv.23"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> </output> </layer> <layer id="1618" name="Constant_11390" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1619" name="Constant_11392" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1620" name="Constant_11394" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1621" name="__module.model.model.layers.11.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2157,query_states.23"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1622" name="Constant_96632" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1623" name="__module.model.model.layers.11.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2161"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="1624" name="__module.model.model.layers.11.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1625" name="__module.model.model.layers.11.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2162,q.23"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1626" name="__module.model.model.layers.11.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="2211"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1627" name="Constant_11957" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1628" name="Constant_11959" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1629" name="Constant_11961" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1630" name="__module.model.model.layers.11.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2221,x2.45"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="1631" name="Constant_90148_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1632" name="Constant_90148" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1633" name="__module.model.model.layers.11.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2222"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="1634" name="Constant_11854" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1635" name="Constant_11898" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1636" name="Constant_11900" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1637" name="__module.model.model.layers.11.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2216"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="1638" name="__module.model.model.layers.11.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="2224"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1639" name="__module.model.model.layers.11.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="2225"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1640" name="__module.model.model.layers.11.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="2226"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1641" name="Constant_102482_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="1642" name="Constant_102482" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="1643" name="Constant_102475" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1644" name="Constant_102477" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1645" name="Constant_102479" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1646" name="Concat_102480" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1647" name="Broadcast_102483" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="1648" name="ReadValue_101059" type="ReadValue" version="opset6"> <data variable_id="past_key_values.11.keypresent.11.key" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.11.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1649" name="Constant_99917" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="1650" name="Gather_99918" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1651" name="Constant_11400" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1652" name="Constant_11402" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1653" name="Constant_11404" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1654" name="__module.model.model.layers.11.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2158,key_states.49"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1655" name="Constant_96633" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1656" name="__module.model.model.layers.11.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2164"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="1657" name="__module.model.model.layers.11.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1658" name="__module.model.model.layers.11.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2165,key_states.51"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1659" name="__module.model.model.layers.11.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="2227"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1660" name="Constant_12100" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1661" name="Constant_12102" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1662" name="Constant_12104" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1663" name="__module.model.model.layers.11.self_attn/aten::slice/Slice_4" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2237,x2.47"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="1664" name="Constant_90149_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1665" name="Constant_90149" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1666" name="__module.model.model.layers.11.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2238"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="1667" name="Constant_11997" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1668" name="Constant_12041" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1669" name="Constant_12043" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1670" name="__module.model.model.layers.11.self_attn/aten::slice/Slice_5" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2232"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="1671" name="__module.model.model.layers.11.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="2240"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1672" name="__module.model.model.layers.11.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="2241"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1673" name="__module.model.model.layers.11.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="2242"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1674" name="__module.model.model.layers.11.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.273,present.11.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1675" name="Constant_102470_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="1676" name="Constant_102470" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="1677" name="Constant_102463" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1678" name="Constant_102465" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1679" name="Constant_102467" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1680" name="Concat_102468" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1681" name="Broadcast_102471" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="1682" name="ReadValue_101061" type="ReadValue" version="opset6"> <data variable_id="past_key_values.11.valuepresent.11.value" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.11.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1683" name="Constant_99920" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="1684" name="Gather_99921" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1685" name="Constant_11410" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1686" name="Constant_11412" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1687" name="Constant_11414" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1688" name="__module.model.model.layers.11.self_attn/aten::slice/Slice_6" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2159,value_states.23"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1689" name="Constant_96634" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1690" name="__module.model.model.layers.11.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2167"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="1691" name="__module.model.model.layers.11.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1692" name="__module.model.model.layers.11.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2168"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1693" name="__module.model.model.layers.11.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.275,present.11.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1694" name="__module.model.model.layers.11.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="2252,attn_output.45"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1695" name="__module.model.model.layers.11.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1696" name="__module.model.model.layers.11.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2253"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="1697" name="Constant_96635" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="56635704" size="24" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="1698" name="__module.model.model.layers.11.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="2256"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1699" name="self.model.model.layers.11.self_attn.o_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 3072" offset="2548187476" size="18874368" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.11.self_attn.o_proj.weight"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1700" name="self.model.model.layers.11.self_attn.o_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1701" name="__module.model.model.layers.11.self_attn.o_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2258,2260,input.67"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1702" name="__module.model.model.layers.11/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2264,2266,2277,hidden_states.277,hidden_states.279"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1703" name="Constant_90153_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="2567061844" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1704" name="Constant_90153" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1705" name="Constant_90152_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1706" name="Constant_90152" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1707" name="Constant_90150_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1708" name="Constant_90150" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1709" name="__module.model.model.layers.11.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2267"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1710" name="Constant_12272" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="2268"> <dim>1</dim> </port> </output> </layer> <layer id="1711" name="__module.model.model.layers.11.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2269,variance.47"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1712" name="Constant_90151_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1713" name="Constant_90151" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1714" name="__module.model.model.layers.11.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2270"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1715" name="__module.model.model.layers.11.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1716" name="__module.model.model.layers.11.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2271"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1717" name="__module.model.model.layers.11.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2272,2273,hidden_states.281,hidden_states.283"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1718" name="__module.model.model.layers.11.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2274,2276"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1719" name="self.model.model.layers.11.mlp.gate_up_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="16384, 3072" offset="2567067988" size="100663296" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.11.mlp.gate_up_proj.weight"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1720" name="self.model.model.layers.11.mlp.gate_up_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1721" name="__module.model.model.layers.11.mlp.gate_up_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2281,up_states.45"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> </output> </layer> <layer id="1722" name="__module.model.model.layers.11.mlp/prim::ListUnpack/VariadicSplit" type="VariadicSplit" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> <port id="1" precision="I64" /> <port id="2" precision="I32"> <dim>2</dim> </port> </input> <output> <port id="3" precision="FP32" names="2283,input.69"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="4" precision="FP32" names="2284,up_states.47"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="1723" name="__module.model.model.layers.11.mlp.activation_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32" names="2285"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="1724" name="__module.model.model.layers.11.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="2286"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="1725" name="self.model.model.layers.11.mlp.down_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 8192" offset="2667731284" size="50331648" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.11.mlp.down_proj.weight"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="1726" name="self.model.model.layers.11.mlp.down_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="1727" name="__module.model.model.layers.11.mlp.down_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="2288,input.71"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1728" name="__module.model.model.layers.11/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2290,2292,2300,2311,hidden_states.287,hidden_states.289"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1729" name="Constant_90157_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="2718062932" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1730" name="Constant_90157" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1731" name="Constant_90156_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1732" name="Constant_90156" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1733" name="Constant_90154_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1734" name="Constant_90154" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1735" name="__module.model.model.layers.12.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2301"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1736" name="Constant_12341" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="2302"> <dim>1</dim> </port> </output> </layer> <layer id="1737" name="__module.model.model.layers.12.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2303,variance.49"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1738" name="Constant_90155_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1739" name="Constant_90155" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1740" name="__module.model.model.layers.12.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2304"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1741" name="__module.model.model.layers.12.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1742" name="__module.model.model.layers.12.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2305"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1743" name="__module.model.model.layers.12.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2306,2307,hidden_states.291,hidden_states.293"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1744" name="__module.model.model.layers.12.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2308,2310,hidden_states.295"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1745" name="self.model.model.layers.12.self_attn.qkv_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="9216, 3072" offset="2718069076" size="56623104" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.12.self_attn.qkv_proj.weight"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1746" name="self.model.model.layers.12.self_attn.qkv_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1747" name="__module.model.model.layers.12.self_attn.qkv_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2317,qkv.25"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> </output> </layer> <layer id="1748" name="Constant_12384" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1749" name="Constant_12386" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1750" name="Constant_12388" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1751" name="__module.model.model.layers.12.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2318,query_states.25"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1752" name="Constant_96636" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1753" name="__module.model.model.layers.12.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2322"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="1754" name="__module.model.model.layers.12.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1755" name="__module.model.model.layers.12.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2323,q.25"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1756" name="__module.model.model.layers.12.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="2372"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1757" name="Constant_12951" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1758" name="Constant_12953" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1759" name="Constant_12955" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1760" name="__module.model.model.layers.12.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2382,x2.49"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="1761" name="Constant_90158_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1762" name="Constant_90158" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1763" name="__module.model.model.layers.12.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2383"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="1764" name="Constant_12848" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1765" name="Constant_12892" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1766" name="Constant_12894" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1767" name="__module.model.model.layers.12.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2377"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="1768" name="__module.model.model.layers.12.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="2385"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1769" name="__module.model.model.layers.12.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="2386"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1770" name="__module.model.model.layers.12.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="2387"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1771" name="Constant_102506_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="1772" name="Constant_102506" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="1773" name="Constant_102499" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1774" name="Constant_102501" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1775" name="Constant_102503" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1776" name="Concat_102504" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1777" name="Broadcast_102507" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="1778" name="ReadValue_101063" type="ReadValue" version="opset6"> <data variable_id="past_key_values.12.keypresent.12.key" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.12.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1779" name="Constant_99923" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="1780" name="Gather_99924" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1781" name="Constant_12394" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1782" name="Constant_12396" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1783" name="Constant_12398" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1784" name="__module.model.model.layers.12.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2319,key_states.53"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1785" name="Constant_96637" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1786" name="__module.model.model.layers.12.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2325"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="1787" name="__module.model.model.layers.12.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1788" name="__module.model.model.layers.12.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2326,key_states.55"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1789" name="__module.model.model.layers.12.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="2388"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1790" name="Constant_13094" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1791" name="Constant_13096" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1792" name="Constant_13098" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1793" name="__module.model.model.layers.12.self_attn/aten::slice/Slice_4" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2398,x2.51"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="1794" name="Constant_90159_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1795" name="Constant_90159" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1796" name="__module.model.model.layers.12.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2399"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="1797" name="Constant_12991" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1798" name="Constant_13035" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1799" name="Constant_13037" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1800" name="__module.model.model.layers.12.self_attn/aten::slice/Slice_5" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2393"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="1801" name="__module.model.model.layers.12.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="2401"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1802" name="__module.model.model.layers.12.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="2402"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1803" name="__module.model.model.layers.12.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="2403"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1804" name="__module.model.model.layers.12.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.297,present.12.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1805" name="Constant_102494_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="1806" name="Constant_102494" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="1807" name="Constant_102487" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1808" name="Constant_102489" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1809" name="Constant_102491" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1810" name="Concat_102492" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1811" name="Broadcast_102495" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="1812" name="ReadValue_101065" type="ReadValue" version="opset6"> <data variable_id="past_key_values.12.valuepresent.12.value" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.12.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1813" name="Constant_99926" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="1814" name="Gather_99927" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1815" name="Constant_12404" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1816" name="Constant_12406" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1817" name="Constant_12408" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1818" name="__module.model.model.layers.12.self_attn/aten::slice/Slice_6" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2320,value_states.25"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1819" name="Constant_96638" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1820" name="__module.model.model.layers.12.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2328"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="1821" name="__module.model.model.layers.12.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1822" name="__module.model.model.layers.12.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2329"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1823" name="__module.model.model.layers.12.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.299,present.12.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1824" name="__module.model.model.layers.12.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="2413,attn_output.49"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1825" name="__module.model.model.layers.12.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1826" name="__module.model.model.layers.12.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2414"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="1827" name="Constant_96639" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="56635704" size="24" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="1828" name="__module.model.model.layers.12.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="2417"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1829" name="self.model.model.layers.12.self_attn.o_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 3072" offset="2774692180" size="18874368" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.12.self_attn.o_proj.weight"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1830" name="self.model.model.layers.12.self_attn.o_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1831" name="__module.model.model.layers.12.self_attn.o_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2419,2421,input.73"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1832" name="__module.model.model.layers.12/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2425,2427,2438,hidden_states.301,hidden_states.303"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1833" name="Constant_90163_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="2793566548" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1834" name="Constant_90163" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1835" name="Constant_90162_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1836" name="Constant_90162" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1837" name="Constant_90160_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1838" name="Constant_90160" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1839" name="__module.model.model.layers.12.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2428"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1840" name="Constant_13266" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="2429"> <dim>1</dim> </port> </output> </layer> <layer id="1841" name="__module.model.model.layers.12.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2430,variance.51"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1842" name="Constant_90161_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1843" name="Constant_90161" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1844" name="__module.model.model.layers.12.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2431"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1845" name="__module.model.model.layers.12.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1846" name="__module.model.model.layers.12.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2432"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1847" name="__module.model.model.layers.12.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2433,2434,hidden_states.305,hidden_states.307"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1848" name="__module.model.model.layers.12.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2435,2437"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1849" name="self.model.model.layers.12.mlp.gate_up_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="16384, 3072" offset="2793572692" size="100663296" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.12.mlp.gate_up_proj.weight"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1850" name="self.model.model.layers.12.mlp.gate_up_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1851" name="__module.model.model.layers.12.mlp.gate_up_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2442,up_states.49"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> </output> </layer> <layer id="1852" name="__module.model.model.layers.12.mlp/prim::ListUnpack/VariadicSplit" type="VariadicSplit" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> <port id="1" precision="I64" /> <port id="2" precision="I32"> <dim>2</dim> </port> </input> <output> <port id="3" precision="FP32" names="2444,input.75"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="4" precision="FP32" names="2445,up_states.51"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="1853" name="__module.model.model.layers.12.mlp.activation_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32" names="2446"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="1854" name="__module.model.model.layers.12.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="2447"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="1855" name="self.model.model.layers.12.mlp.down_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 8192" offset="2894235988" size="50331648" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.12.mlp.down_proj.weight"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="1856" name="self.model.model.layers.12.mlp.down_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="1857" name="__module.model.model.layers.12.mlp.down_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="2449,input.77"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1858" name="__module.model.model.layers.12/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2451,2453,2461,2472,hidden_states.311,hidden_states.313"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1859" name="Constant_90167_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="2944567636" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1860" name="Constant_90167" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1861" name="Constant_90166_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1862" name="Constant_90166" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1863" name="Constant_90164_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1864" name="Constant_90164" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1865" name="__module.model.model.layers.13.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2462"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1866" name="Constant_13335" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="2463"> <dim>1</dim> </port> </output> </layer> <layer id="1867" name="__module.model.model.layers.13.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2464,variance.53"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1868" name="Constant_90165_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1869" name="Constant_90165" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1870" name="__module.model.model.layers.13.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2465"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1871" name="__module.model.model.layers.13.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1872" name="__module.model.model.layers.13.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2466"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1873" name="__module.model.model.layers.13.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2467,2468,hidden_states.315,hidden_states.317"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1874" name="__module.model.model.layers.13.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2469,2471,hidden_states.319"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1875" name="self.model.model.layers.13.self_attn.qkv_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="9216, 3072" offset="2944573780" size="56623104" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.13.self_attn.qkv_proj.weight"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1876" name="self.model.model.layers.13.self_attn.qkv_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1877" name="__module.model.model.layers.13.self_attn.qkv_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2478,qkv.27"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> </output> </layer> <layer id="1878" name="Constant_13378" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1879" name="Constant_13380" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1880" name="Constant_13382" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1881" name="__module.model.model.layers.13.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2479,query_states.27"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1882" name="Constant_96640" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1883" name="__module.model.model.layers.13.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2483"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="1884" name="__module.model.model.layers.13.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1885" name="__module.model.model.layers.13.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2484,q.27"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1886" name="__module.model.model.layers.13.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="2533"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1887" name="Constant_13945" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1888" name="Constant_13947" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1889" name="Constant_13949" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1890" name="__module.model.model.layers.13.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2543,x2.53"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="1891" name="Constant_90168_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1892" name="Constant_90168" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1893" name="__module.model.model.layers.13.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2544"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="1894" name="Constant_13842" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1895" name="Constant_13886" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1896" name="Constant_13888" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1897" name="__module.model.model.layers.13.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2538"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="1898" name="__module.model.model.layers.13.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="2546"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1899" name="__module.model.model.layers.13.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="2547"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1900" name="__module.model.model.layers.13.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="2548"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1901" name="Constant_102530_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="1902" name="Constant_102530" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="1903" name="Constant_102523" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1904" name="Constant_102525" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1905" name="Constant_102527" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1906" name="Concat_102528" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1907" name="Broadcast_102531" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="1908" name="ReadValue_101067" type="ReadValue" version="opset6"> <data variable_id="past_key_values.13.keypresent.13.key" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.13.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1909" name="Constant_99929" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="1910" name="Gather_99930" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1911" name="Constant_13388" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1912" name="Constant_13390" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1913" name="Constant_13392" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1914" name="__module.model.model.layers.13.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2480,key_states.57"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1915" name="Constant_96641" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1916" name="__module.model.model.layers.13.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2486"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="1917" name="__module.model.model.layers.13.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1918" name="__module.model.model.layers.13.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2487,key_states.59"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1919" name="__module.model.model.layers.13.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="2549"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1920" name="Constant_14088" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1921" name="Constant_14090" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1922" name="Constant_14092" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1923" name="__module.model.model.layers.13.self_attn/aten::slice/Slice_4" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2559,x2.55"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="1924" name="Constant_90169_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1925" name="Constant_90169" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1926" name="__module.model.model.layers.13.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2560"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="1927" name="Constant_13985" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1928" name="Constant_14029" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1929" name="Constant_14031" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1930" name="__module.model.model.layers.13.self_attn/aten::slice/Slice_5" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2554"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="1931" name="__module.model.model.layers.13.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="2562"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1932" name="__module.model.model.layers.13.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="2563"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1933" name="__module.model.model.layers.13.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="2564"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1934" name="__module.model.model.layers.13.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.321,present.13.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1935" name="Constant_102518_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="1936" name="Constant_102518" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="1937" name="Constant_102511" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1938" name="Constant_102513" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1939" name="Constant_102515" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1940" name="Concat_102516" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1941" name="Broadcast_102519" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="1942" name="ReadValue_101069" type="ReadValue" version="opset6"> <data variable_id="past_key_values.13.valuepresent.13.value" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.13.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1943" name="Constant_99932" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="1944" name="Gather_99933" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1945" name="Constant_13398" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1946" name="Constant_13400" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1947" name="Constant_13402" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="1948" name="__module.model.model.layers.13.self_attn/aten::slice/Slice_6" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2481,value_states.27"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1949" name="Constant_96642" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="1950" name="__module.model.model.layers.13.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2489"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="1951" name="__module.model.model.layers.13.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1952" name="__module.model.model.layers.13.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2490"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1953" name="__module.model.model.layers.13.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.323,present.13.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1954" name="__module.model.model.layers.13.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="2574,attn_output.53"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1955" name="__module.model.model.layers.13.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="1956" name="__module.model.model.layers.13.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2575"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="1957" name="Constant_96643" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="56635704" size="24" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="1958" name="__module.model.model.layers.13.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="2578"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1959" name="self.model.model.layers.13.self_attn.o_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 3072" offset="3001196884" size="18874368" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.13.self_attn.o_proj.weight"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1960" name="self.model.model.layers.13.self_attn.o_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1961" name="__module.model.model.layers.13.self_attn.o_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2580,2582,input.79"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1962" name="__module.model.model.layers.13/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2586,2588,2599,hidden_states.325,hidden_states.327"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1963" name="Constant_90173_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="3020071252" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1964" name="Constant_90173" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1965" name="Constant_90172_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1966" name="Constant_90172" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1967" name="Constant_90170_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1968" name="Constant_90170" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1969" name="__module.model.model.layers.13.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2589"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1970" name="Constant_14260" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="2590"> <dim>1</dim> </port> </output> </layer> <layer id="1971" name="__module.model.model.layers.13.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2591,variance.55"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1972" name="Constant_90171_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1973" name="Constant_90171" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1974" name="__module.model.model.layers.13.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2592"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1975" name="__module.model.model.layers.13.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1976" name="__module.model.model.layers.13.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2593"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1977" name="__module.model.model.layers.13.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2594,2595,hidden_states.329,hidden_states.331"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1978" name="__module.model.model.layers.13.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2596,2598"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1979" name="self.model.model.layers.13.mlp.gate_up_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="16384, 3072" offset="3020077396" size="100663296" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.13.mlp.gate_up_proj.weight"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1980" name="self.model.model.layers.13.mlp.gate_up_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1981" name="__module.model.model.layers.13.mlp.gate_up_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2603,up_states.53"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> </output> </layer> <layer id="1982" name="__module.model.model.layers.13.mlp/prim::ListUnpack/VariadicSplit" type="VariadicSplit" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> <port id="1" precision="I64" /> <port id="2" precision="I32"> <dim>2</dim> </port> </input> <output> <port id="3" precision="FP32" names="2605,input.81"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="4" precision="FP32" names="2606,up_states.55"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="1983" name="__module.model.model.layers.13.mlp.activation_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32" names="2607"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="1984" name="__module.model.model.layers.13.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="2608"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="1985" name="self.model.model.layers.13.mlp.down_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 8192" offset="3120740692" size="50331648" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.13.mlp.down_proj.weight"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="1986" name="self.model.model.layers.13.mlp.down_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="1987" name="__module.model.model.layers.13.mlp.down_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="2610,input.83"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1988" name="__module.model.model.layers.13/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2612,2614,2622,2633,hidden_states.335,hidden_states.337"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1989" name="Constant_90177_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="3171072340" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1990" name="Constant_90177" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1991" name="Constant_90176_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1992" name="Constant_90176" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1993" name="Constant_90174_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1994" name="Constant_90174" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1995" name="__module.model.model.layers.14.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2623"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="1996" name="Constant_14329" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="2624"> <dim>1</dim> </port> </output> </layer> <layer id="1997" name="__module.model.model.layers.14.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2625,variance.57"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1998" name="Constant_90175_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="1999" name="Constant_90175" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2000" name="__module.model.model.layers.14.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2626"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2001" name="__module.model.model.layers.14.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2002" name="__module.model.model.layers.14.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2627"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2003" name="__module.model.model.layers.14.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2628,2629,hidden_states.339,hidden_states.341"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2004" name="__module.model.model.layers.14.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2630,2632,hidden_states.343"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2005" name="self.model.model.layers.14.self_attn.qkv_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="9216, 3072" offset="3171078484" size="56623104" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.14.self_attn.qkv_proj.weight"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2006" name="self.model.model.layers.14.self_attn.qkv_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2007" name="__module.model.model.layers.14.self_attn.qkv_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2639,qkv.29"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> </output> </layer> <layer id="2008" name="Constant_14372" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2009" name="Constant_14374" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2010" name="Constant_14376" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2011" name="__module.model.model.layers.14.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2640,query_states.29"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2012" name="Constant_96644" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2013" name="__module.model.model.layers.14.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2644"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="2014" name="__module.model.model.layers.14.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2015" name="__module.model.model.layers.14.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2645,q.29"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2016" name="__module.model.model.layers.14.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="2694"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2017" name="Constant_14939" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2018" name="Constant_14941" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2019" name="Constant_14943" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2020" name="__module.model.model.layers.14.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2704,x2.57"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="2021" name="Constant_90178_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2022" name="Constant_90178" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2023" name="__module.model.model.layers.14.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2705"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="2024" name="Constant_14836" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2025" name="Constant_14880" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2026" name="Constant_14882" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2027" name="__module.model.model.layers.14.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2699"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="2028" name="__module.model.model.layers.14.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="2707"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2029" name="__module.model.model.layers.14.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="2708"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2030" name="__module.model.model.layers.14.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="2709"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2031" name="Constant_102554_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="2032" name="Constant_102554" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="2033" name="Constant_102547" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2034" name="Constant_102549" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2035" name="Constant_102551" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2036" name="Concat_102552" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2037" name="Broadcast_102555" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="2038" name="ReadValue_101071" type="ReadValue" version="opset6"> <data variable_id="past_key_values.14.keypresent.14.key" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.14.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2039" name="Constant_99935" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="2040" name="Gather_99936" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2041" name="Constant_14382" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2042" name="Constant_14384" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2043" name="Constant_14386" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2044" name="__module.model.model.layers.14.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2641,key_states.61"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2045" name="Constant_96645" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2046" name="__module.model.model.layers.14.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2647"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="2047" name="__module.model.model.layers.14.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2048" name="__module.model.model.layers.14.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2648,key_states.63"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2049" name="__module.model.model.layers.14.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="2710"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2050" name="Constant_15082" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2051" name="Constant_15084" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2052" name="Constant_15086" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2053" name="__module.model.model.layers.14.self_attn/aten::slice/Slice_4" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2720,x2.59"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="2054" name="Constant_90179_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2055" name="Constant_90179" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2056" name="__module.model.model.layers.14.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2721"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="2057" name="Constant_14979" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2058" name="Constant_15023" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2059" name="Constant_15025" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2060" name="__module.model.model.layers.14.self_attn/aten::slice/Slice_5" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2715"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="2061" name="__module.model.model.layers.14.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="2723"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2062" name="__module.model.model.layers.14.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="2724"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2063" name="__module.model.model.layers.14.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="2725"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2064" name="__module.model.model.layers.14.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.345,present.14.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2065" name="Constant_102542_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="2066" name="Constant_102542" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="2067" name="Constant_102535" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2068" name="Constant_102537" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2069" name="Constant_102539" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2070" name="Concat_102540" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2071" name="Broadcast_102543" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="2072" name="ReadValue_101073" type="ReadValue" version="opset6"> <data variable_id="past_key_values.14.valuepresent.14.value" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.14.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2073" name="Constant_99938" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="2074" name="Gather_99939" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2075" name="Constant_14392" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2076" name="Constant_14394" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2077" name="Constant_14396" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2078" name="__module.model.model.layers.14.self_attn/aten::slice/Slice_6" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2642,value_states.29"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2079" name="Constant_96646" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2080" name="__module.model.model.layers.14.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2650"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="2081" name="__module.model.model.layers.14.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2082" name="__module.model.model.layers.14.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2651"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2083" name="__module.model.model.layers.14.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.347,present.14.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2084" name="__module.model.model.layers.14.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="2735,attn_output.57"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2085" name="__module.model.model.layers.14.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2086" name="__module.model.model.layers.14.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2736"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="2087" name="Constant_96647" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="56635704" size="24" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="2088" name="__module.model.model.layers.14.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="2739"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2089" name="self.model.model.layers.14.self_attn.o_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 3072" offset="3227701588" size="18874368" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.14.self_attn.o_proj.weight"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2090" name="self.model.model.layers.14.self_attn.o_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2091" name="__module.model.model.layers.14.self_attn.o_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2741,2743,input.85"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2092" name="__module.model.model.layers.14/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2747,2749,2760,hidden_states.349,hidden_states.351"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2093" name="Constant_90183_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="3246575956" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2094" name="Constant_90183" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2095" name="Constant_90182_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2096" name="Constant_90182" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2097" name="Constant_90180_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2098" name="Constant_90180" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2099" name="__module.model.model.layers.14.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2750"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2100" name="Constant_15254" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="2751"> <dim>1</dim> </port> </output> </layer> <layer id="2101" name="__module.model.model.layers.14.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2752,variance.59"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2102" name="Constant_90181_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2103" name="Constant_90181" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2104" name="__module.model.model.layers.14.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2753"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2105" name="__module.model.model.layers.14.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2106" name="__module.model.model.layers.14.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2754"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2107" name="__module.model.model.layers.14.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2755,2756,hidden_states.353,hidden_states.355"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2108" name="__module.model.model.layers.14.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2757,2759"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2109" name="self.model.model.layers.14.mlp.gate_up_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="16384, 3072" offset="3246582100" size="100663296" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.14.mlp.gate_up_proj.weight"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2110" name="self.model.model.layers.14.mlp.gate_up_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2111" name="__module.model.model.layers.14.mlp.gate_up_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2764,up_states.57"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> </output> </layer> <layer id="2112" name="__module.model.model.layers.14.mlp/prim::ListUnpack/VariadicSplit" type="VariadicSplit" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> <port id="1" precision="I64" /> <port id="2" precision="I32"> <dim>2</dim> </port> </input> <output> <port id="3" precision="FP32" names="2766,input.87"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="4" precision="FP32" names="2767,up_states.59"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="2113" name="__module.model.model.layers.14.mlp.activation_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32" names="2768"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="2114" name="__module.model.model.layers.14.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="2769"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="2115" name="self.model.model.layers.14.mlp.down_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 8192" offset="3347245396" size="50331648" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.14.mlp.down_proj.weight"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="2116" name="self.model.model.layers.14.mlp.down_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="2117" name="__module.model.model.layers.14.mlp.down_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="2771,input.89"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2118" name="__module.model.model.layers.14/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2773,2775,2783,2794,hidden_states.359,hidden_states.361"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2119" name="Constant_90187_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="3397577044" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2120" name="Constant_90187" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2121" name="Constant_90186_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2122" name="Constant_90186" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2123" name="Constant_90184_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2124" name="Constant_90184" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2125" name="__module.model.model.layers.15.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2784"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2126" name="Constant_15323" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="2785"> <dim>1</dim> </port> </output> </layer> <layer id="2127" name="__module.model.model.layers.15.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2786,variance.61"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2128" name="Constant_90185_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2129" name="Constant_90185" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2130" name="__module.model.model.layers.15.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2787"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2131" name="__module.model.model.layers.15.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2132" name="__module.model.model.layers.15.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2788"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2133" name="__module.model.model.layers.15.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2789,2790,hidden_states.363,hidden_states.365"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2134" name="__module.model.model.layers.15.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2791,2793,hidden_states.367"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2135" name="self.model.model.layers.15.self_attn.qkv_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="9216, 3072" offset="3397583188" size="56623104" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.15.self_attn.qkv_proj.weight"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2136" name="self.model.model.layers.15.self_attn.qkv_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2137" name="__module.model.model.layers.15.self_attn.qkv_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2800,qkv.31"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> </output> </layer> <layer id="2138" name="Constant_15366" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2139" name="Constant_15368" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2140" name="Constant_15370" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2141" name="__module.model.model.layers.15.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2801,query_states.31"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2142" name="Constant_96648" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2143" name="__module.model.model.layers.15.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2805"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="2144" name="__module.model.model.layers.15.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2145" name="__module.model.model.layers.15.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2806,q.31"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2146" name="__module.model.model.layers.15.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="2855"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2147" name="Constant_15933" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2148" name="Constant_15935" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2149" name="Constant_15937" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2150" name="__module.model.model.layers.15.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2865,x2.61"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="2151" name="Constant_90188_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2152" name="Constant_90188" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2153" name="__module.model.model.layers.15.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2866"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="2154" name="Constant_15830" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2155" name="Constant_15874" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2156" name="Constant_15876" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2157" name="__module.model.model.layers.15.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2860"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="2158" name="__module.model.model.layers.15.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="2868"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2159" name="__module.model.model.layers.15.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="2869"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2160" name="__module.model.model.layers.15.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="2870"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2161" name="Constant_102578_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="2162" name="Constant_102578" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="2163" name="Constant_102571" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2164" name="Constant_102573" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2165" name="Constant_102575" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2166" name="Concat_102576" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2167" name="Broadcast_102579" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="2168" name="ReadValue_101075" type="ReadValue" version="opset6"> <data variable_id="past_key_values.15.keypresent.15.key" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.15.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2169" name="Constant_99941" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="2170" name="Gather_99942" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2171" name="Constant_15376" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2172" name="Constant_15378" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2173" name="Constant_15380" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2174" name="__module.model.model.layers.15.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2802,key_states.65"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2175" name="Constant_96649" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2176" name="__module.model.model.layers.15.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2808"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="2177" name="__module.model.model.layers.15.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2178" name="__module.model.model.layers.15.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2809,key_states.67"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2179" name="__module.model.model.layers.15.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="2871"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2180" name="Constant_16076" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2181" name="Constant_16078" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2182" name="Constant_16080" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2183" name="__module.model.model.layers.15.self_attn/aten::slice/Slice_4" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2881,x2.63"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="2184" name="Constant_90189_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2185" name="Constant_90189" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2186" name="__module.model.model.layers.15.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2882"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="2187" name="Constant_15973" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2188" name="Constant_16017" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2189" name="Constant_16019" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2190" name="__module.model.model.layers.15.self_attn/aten::slice/Slice_5" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2876"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="2191" name="__module.model.model.layers.15.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="2884"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2192" name="__module.model.model.layers.15.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="2885"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2193" name="__module.model.model.layers.15.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="2886"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2194" name="__module.model.model.layers.15.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.369,present.15.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2195" name="Constant_102566_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="2196" name="Constant_102566" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="2197" name="Constant_102559" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2198" name="Constant_102561" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2199" name="Constant_102563" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2200" name="Concat_102564" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2201" name="Broadcast_102567" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="2202" name="ReadValue_101077" type="ReadValue" version="opset6"> <data variable_id="past_key_values.15.valuepresent.15.value" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.15.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2203" name="Constant_99944" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="2204" name="Gather_99945" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2205" name="Constant_15386" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2206" name="Constant_15388" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2207" name="Constant_15390" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2208" name="__module.model.model.layers.15.self_attn/aten::slice/Slice_6" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2803,value_states.31"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2209" name="Constant_96650" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2210" name="__module.model.model.layers.15.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2811"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="2211" name="__module.model.model.layers.15.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2212" name="__module.model.model.layers.15.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2812"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2213" name="__module.model.model.layers.15.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.371,present.15.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2214" name="__module.model.model.layers.15.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="2896,attn_output.61"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2215" name="__module.model.model.layers.15.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2216" name="__module.model.model.layers.15.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2897"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="2217" name="Constant_96651" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="56635704" size="24" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="2218" name="__module.model.model.layers.15.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="2900"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2219" name="self.model.model.layers.15.self_attn.o_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 3072" offset="3454206292" size="18874368" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.15.self_attn.o_proj.weight"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2220" name="self.model.model.layers.15.self_attn.o_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2221" name="__module.model.model.layers.15.self_attn.o_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2902,2904,input.91"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2222" name="__module.model.model.layers.15/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2908,2910,2921,hidden_states.373,hidden_states.375"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2223" name="Constant_90193_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="3473080660" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2224" name="Constant_90193" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2225" name="Constant_90192_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2226" name="Constant_90192" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2227" name="Constant_90190_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2228" name="Constant_90190" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2229" name="__module.model.model.layers.15.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2911"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2230" name="Constant_16248" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="2912"> <dim>1</dim> </port> </output> </layer> <layer id="2231" name="__module.model.model.layers.15.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2913,variance.63"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2232" name="Constant_90191_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2233" name="Constant_90191" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2234" name="__module.model.model.layers.15.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2914"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2235" name="__module.model.model.layers.15.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2236" name="__module.model.model.layers.15.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2915"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2237" name="__module.model.model.layers.15.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2916,2917,hidden_states.377,hidden_states.379"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2238" name="__module.model.model.layers.15.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2918,2920"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2239" name="self.model.model.layers.15.mlp.gate_up_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="16384, 3072" offset="3473086804" size="100663296" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.15.mlp.gate_up_proj.weight"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2240" name="self.model.model.layers.15.mlp.gate_up_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2241" name="__module.model.model.layers.15.mlp.gate_up_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2925,up_states.61"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> </output> </layer> <layer id="2242" name="__module.model.model.layers.15.mlp/prim::ListUnpack/VariadicSplit" type="VariadicSplit" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> <port id="1" precision="I64" /> <port id="2" precision="I32"> <dim>2</dim> </port> </input> <output> <port id="3" precision="FP32" names="2927,input.93"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="4" precision="FP32" names="2928,up_states.63"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="2243" name="__module.model.model.layers.15.mlp.activation_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32" names="2929"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="2244" name="__module.model.model.layers.15.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="2930"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="2245" name="self.model.model.layers.15.mlp.down_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 8192" offset="3573750100" size="50331648" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.15.mlp.down_proj.weight"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="2246" name="self.model.model.layers.15.mlp.down_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="2247" name="__module.model.model.layers.15.mlp.down_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="2932,input.95"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2248" name="__module.model.model.layers.15/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2934,2936,2944,2955,hidden_states.383,hidden_states.385"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2249" name="Constant_90197_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="3624081748" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2250" name="Constant_90197" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2251" name="Constant_90196_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2252" name="Constant_90196" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2253" name="Constant_90194_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2254" name="Constant_90194" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2255" name="__module.model.model.layers.16.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2945"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2256" name="Constant_16317" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="2946"> <dim>1</dim> </port> </output> </layer> <layer id="2257" name="__module.model.model.layers.16.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2947,variance.65"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2258" name="Constant_90195_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2259" name="Constant_90195" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2260" name="__module.model.model.layers.16.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2948"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2261" name="__module.model.model.layers.16.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2262" name="__module.model.model.layers.16.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2949"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2263" name="__module.model.model.layers.16.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="2950,2951,hidden_states.387,hidden_states.389"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2264" name="__module.model.model.layers.16.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2952,2954,hidden_states.391"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2265" name="self.model.model.layers.16.self_attn.qkv_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="9216, 3072" offset="3624087892" size="56623104" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.16.self_attn.qkv_proj.weight"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2266" name="self.model.model.layers.16.self_attn.qkv_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2267" name="__module.model.model.layers.16.self_attn.qkv_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="2961,qkv.33"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> </output> </layer> <layer id="2268" name="Constant_16360" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2269" name="Constant_16362" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2270" name="Constant_16364" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2271" name="__module.model.model.layers.16.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2962,query_states.33"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2272" name="Constant_96652" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2273" name="__module.model.model.layers.16.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2966"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="2274" name="__module.model.model.layers.16.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2275" name="__module.model.model.layers.16.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2967,q.33"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2276" name="__module.model.model.layers.16.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="3016"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2277" name="Constant_16927" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2278" name="Constant_16929" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2279" name="Constant_16931" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2280" name="__module.model.model.layers.16.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3026,x2.65"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="2281" name="Constant_90198_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2282" name="Constant_90198" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2283" name="__module.model.model.layers.16.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3027"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="2284" name="Constant_16824" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2285" name="Constant_16868" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2286" name="Constant_16870" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2287" name="__module.model.model.layers.16.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3021"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="2288" name="__module.model.model.layers.16.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="3029"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2289" name="__module.model.model.layers.16.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="3030"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2290" name="__module.model.model.layers.16.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="3031"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2291" name="Constant_102602_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="2292" name="Constant_102602" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="2293" name="Constant_102595" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2294" name="Constant_102597" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2295" name="Constant_102599" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2296" name="Concat_102600" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2297" name="Broadcast_102603" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="2298" name="ReadValue_101079" type="ReadValue" version="opset6"> <data variable_id="past_key_values.16.keypresent.16.key" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.16.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2299" name="Constant_99947" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="2300" name="Gather_99948" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2301" name="Constant_16370" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2302" name="Constant_16372" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2303" name="Constant_16374" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2304" name="__module.model.model.layers.16.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2963,key_states.69"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2305" name="Constant_96653" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2306" name="__module.model.model.layers.16.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2969"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="2307" name="__module.model.model.layers.16.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2308" name="__module.model.model.layers.16.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2970,key_states.71"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2309" name="__module.model.model.layers.16.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="3032"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2310" name="Constant_17070" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2311" name="Constant_17072" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2312" name="Constant_17074" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2313" name="__module.model.model.layers.16.self_attn/aten::slice/Slice_4" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3042,x2.67"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="2314" name="Constant_90199_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2315" name="Constant_90199" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2316" name="__module.model.model.layers.16.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3043"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="2317" name="Constant_16967" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2318" name="Constant_17011" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2319" name="Constant_17013" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2320" name="__module.model.model.layers.16.self_attn/aten::slice/Slice_5" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3037"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="2321" name="__module.model.model.layers.16.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="3045"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2322" name="__module.model.model.layers.16.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="3046"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2323" name="__module.model.model.layers.16.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="3047"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2324" name="__module.model.model.layers.16.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.393,present.16.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2325" name="Constant_102590_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="2326" name="Constant_102590" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="2327" name="Constant_102583" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2328" name="Constant_102585" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2329" name="Constant_102587" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2330" name="Concat_102588" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2331" name="Broadcast_102591" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="2332" name="ReadValue_101081" type="ReadValue" version="opset6"> <data variable_id="past_key_values.16.valuepresent.16.value" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.16.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2333" name="Constant_99950" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="2334" name="Gather_99951" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2335" name="Constant_16380" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2336" name="Constant_16382" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2337" name="Constant_16384" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2338" name="__module.model.model.layers.16.self_attn/aten::slice/Slice_6" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="2964,value_states.33"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2339" name="Constant_96654" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2340" name="__module.model.model.layers.16.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2972"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="2341" name="__module.model.model.layers.16.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2342" name="__module.model.model.layers.16.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="2973"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2343" name="__module.model.model.layers.16.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.395,present.16.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2344" name="__module.model.model.layers.16.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="3057,attn_output.65"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2345" name="__module.model.model.layers.16.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2346" name="__module.model.model.layers.16.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3058"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="2347" name="Constant_96655" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="56635704" size="24" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="2348" name="__module.model.model.layers.16.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="3061"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2349" name="self.model.model.layers.16.self_attn.o_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 3072" offset="3680710996" size="18874368" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.16.self_attn.o_proj.weight"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2350" name="self.model.model.layers.16.self_attn.o_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2351" name="__module.model.model.layers.16.self_attn.o_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3063,3065,input.97"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2352" name="__module.model.model.layers.16/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3069,3071,3082,hidden_states.397,hidden_states.399"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2353" name="Constant_90203_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="3699585364" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2354" name="Constant_90203" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2355" name="Constant_90202_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2356" name="Constant_90202" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2357" name="Constant_90200_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2358" name="Constant_90200" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2359" name="__module.model.model.layers.16.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3072"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2360" name="Constant_17242" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="3073"> <dim>1</dim> </port> </output> </layer> <layer id="2361" name="__module.model.model.layers.16.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3074,variance.67"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2362" name="Constant_90201_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2363" name="Constant_90201" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2364" name="__module.model.model.layers.16.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3075"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2365" name="__module.model.model.layers.16.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2366" name="__module.model.model.layers.16.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3076"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2367" name="__module.model.model.layers.16.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3077,3078,hidden_states.401,hidden_states.403"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2368" name="__module.model.model.layers.16.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3079,3081"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2369" name="self.model.model.layers.16.mlp.gate_up_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="16384, 3072" offset="3699591508" size="100663296" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.16.mlp.gate_up_proj.weight"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2370" name="self.model.model.layers.16.mlp.gate_up_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2371" name="__module.model.model.layers.16.mlp.gate_up_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3086,up_states.65"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> </output> </layer> <layer id="2372" name="__module.model.model.layers.16.mlp/prim::ListUnpack/VariadicSplit" type="VariadicSplit" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> <port id="1" precision="I64" /> <port id="2" precision="I32"> <dim>2</dim> </port> </input> <output> <port id="3" precision="FP32" names="3088,input.99"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="4" precision="FP32" names="3089,up_states.67"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="2373" name="__module.model.model.layers.16.mlp.activation_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32" names="3090"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="2374" name="__module.model.model.layers.16.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="3091"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="2375" name="self.model.model.layers.16.mlp.down_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 8192" offset="3800254804" size="50331648" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.16.mlp.down_proj.weight"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="2376" name="self.model.model.layers.16.mlp.down_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="2377" name="__module.model.model.layers.16.mlp.down_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="3093,input.101"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2378" name="__module.model.model.layers.16/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3095,3097,3105,3116,hidden_states.407,hidden_states.409"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2379" name="Constant_90207_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="3850586452" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2380" name="Constant_90207" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2381" name="Constant_90206_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2382" name="Constant_90206" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2383" name="Constant_90204_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2384" name="Constant_90204" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2385" name="__module.model.model.layers.17.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3106"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2386" name="Constant_17311" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="3107"> <dim>1</dim> </port> </output> </layer> <layer id="2387" name="__module.model.model.layers.17.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3108,variance.69"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2388" name="Constant_90205_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2389" name="Constant_90205" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2390" name="__module.model.model.layers.17.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3109"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2391" name="__module.model.model.layers.17.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2392" name="__module.model.model.layers.17.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3110"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2393" name="__module.model.model.layers.17.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3111,3112,hidden_states.411,hidden_states.413"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2394" name="__module.model.model.layers.17.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3113,3115,hidden_states.415"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2395" name="self.model.model.layers.17.self_attn.qkv_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="9216, 3072" offset="3850592596" size="56623104" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.17.self_attn.qkv_proj.weight"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2396" name="self.model.model.layers.17.self_attn.qkv_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2397" name="__module.model.model.layers.17.self_attn.qkv_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3122,qkv.35"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> </output> </layer> <layer id="2398" name="Constant_17354" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2399" name="Constant_17356" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2400" name="Constant_17358" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2401" name="__module.model.model.layers.17.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3123,query_states.35"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2402" name="Constant_96656" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2403" name="__module.model.model.layers.17.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3127"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="2404" name="__module.model.model.layers.17.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2405" name="__module.model.model.layers.17.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3128,q.35"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2406" name="__module.model.model.layers.17.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="3177"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2407" name="Constant_17921" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2408" name="Constant_17923" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2409" name="Constant_17925" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2410" name="__module.model.model.layers.17.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3187,x2.69"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="2411" name="Constant_90208_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2412" name="Constant_90208" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2413" name="__module.model.model.layers.17.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3188"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="2414" name="Constant_17818" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2415" name="Constant_17862" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2416" name="Constant_17864" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2417" name="__module.model.model.layers.17.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3182"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="2418" name="__module.model.model.layers.17.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="3190"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2419" name="__module.model.model.layers.17.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="3191"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2420" name="__module.model.model.layers.17.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="3192"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2421" name="Constant_102626_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="2422" name="Constant_102626" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="2423" name="Constant_102619" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2424" name="Constant_102621" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2425" name="Constant_102623" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2426" name="Concat_102624" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2427" name="Broadcast_102627" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="2428" name="ReadValue_101083" type="ReadValue" version="opset6"> <data variable_id="past_key_values.17.keypresent.17.key" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.17.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2429" name="Constant_99953" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="2430" name="Gather_99954" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2431" name="Constant_17364" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2432" name="Constant_17366" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2433" name="Constant_17368" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2434" name="__module.model.model.layers.17.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3124,key_states.73"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2435" name="Constant_96657" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2436" name="__module.model.model.layers.17.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3130"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="2437" name="__module.model.model.layers.17.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2438" name="__module.model.model.layers.17.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3131,key_states.75"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2439" name="__module.model.model.layers.17.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="3193"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2440" name="Constant_18064" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2441" name="Constant_18066" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2442" name="Constant_18068" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2443" name="__module.model.model.layers.17.self_attn/aten::slice/Slice_4" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3203,x2.71"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="2444" name="Constant_90209_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2445" name="Constant_90209" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2446" name="__module.model.model.layers.17.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3204"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="2447" name="Constant_17961" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2448" name="Constant_18005" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2449" name="Constant_18007" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2450" name="__module.model.model.layers.17.self_attn/aten::slice/Slice_5" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3198"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="2451" name="__module.model.model.layers.17.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="3206"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2452" name="__module.model.model.layers.17.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="3207"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2453" name="__module.model.model.layers.17.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="3208"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2454" name="__module.model.model.layers.17.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.417,present.17.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2455" name="Constant_102614_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="2456" name="Constant_102614" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="2457" name="Constant_102607" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2458" name="Constant_102609" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2459" name="Constant_102611" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2460" name="Concat_102612" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2461" name="Broadcast_102615" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="2462" name="ReadValue_101085" type="ReadValue" version="opset6"> <data variable_id="past_key_values.17.valuepresent.17.value" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.17.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2463" name="Constant_99956" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="2464" name="Gather_99957" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2465" name="Constant_17374" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2466" name="Constant_17376" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2467" name="Constant_17378" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2468" name="__module.model.model.layers.17.self_attn/aten::slice/Slice_6" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3125,value_states.35"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2469" name="Constant_96658" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2470" name="__module.model.model.layers.17.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3133"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="2471" name="__module.model.model.layers.17.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2472" name="__module.model.model.layers.17.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3134"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2473" name="__module.model.model.layers.17.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.419,present.17.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2474" name="__module.model.model.layers.17.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="3218,attn_output.69"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2475" name="__module.model.model.layers.17.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2476" name="__module.model.model.layers.17.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3219"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="2477" name="Constant_96659" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="56635704" size="24" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="2478" name="__module.model.model.layers.17.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="3222"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2479" name="self.model.model.layers.17.self_attn.o_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 3072" offset="3907215700" size="18874368" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.17.self_attn.o_proj.weight"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2480" name="self.model.model.layers.17.self_attn.o_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2481" name="__module.model.model.layers.17.self_attn.o_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3224,3226,input.103"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2482" name="__module.model.model.layers.17/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3230,3232,3243,hidden_states.421,hidden_states.423"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2483" name="Constant_90213_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="3926090068" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2484" name="Constant_90213" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2485" name="Constant_90212_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2486" name="Constant_90212" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2487" name="Constant_90210_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2488" name="Constant_90210" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2489" name="__module.model.model.layers.17.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3233"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2490" name="Constant_18236" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="3234"> <dim>1</dim> </port> </output> </layer> <layer id="2491" name="__module.model.model.layers.17.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3235,variance.71"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2492" name="Constant_90211_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2493" name="Constant_90211" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2494" name="__module.model.model.layers.17.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3236"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2495" name="__module.model.model.layers.17.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2496" name="__module.model.model.layers.17.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3237"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2497" name="__module.model.model.layers.17.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3238,3239,hidden_states.425,hidden_states.427"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2498" name="__module.model.model.layers.17.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3240,3242"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2499" name="self.model.model.layers.17.mlp.gate_up_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="16384, 3072" offset="3926096212" size="100663296" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.17.mlp.gate_up_proj.weight"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2500" name="self.model.model.layers.17.mlp.gate_up_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2501" name="__module.model.model.layers.17.mlp.gate_up_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3247,up_states.69"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> </output> </layer> <layer id="2502" name="__module.model.model.layers.17.mlp/prim::ListUnpack/VariadicSplit" type="VariadicSplit" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> <port id="1" precision="I64" /> <port id="2" precision="I32"> <dim>2</dim> </port> </input> <output> <port id="3" precision="FP32" names="3249,input.105"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="4" precision="FP32" names="3250,up_states.71"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="2503" name="__module.model.model.layers.17.mlp.activation_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32" names="3251"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="2504" name="__module.model.model.layers.17.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="3252"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="2505" name="self.model.model.layers.17.mlp.down_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 8192" offset="4026759508" size="50331648" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.17.mlp.down_proj.weight"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="2506" name="self.model.model.layers.17.mlp.down_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="2507" name="__module.model.model.layers.17.mlp.down_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="3254,input.107"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2508" name="__module.model.model.layers.17/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3256,3258,3266,3277,hidden_states.431,hidden_states.433"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2509" name="Constant_90217_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="4077091156" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2510" name="Constant_90217" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2511" name="Constant_90216_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2512" name="Constant_90216" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2513" name="Constant_90214_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2514" name="Constant_90214" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2515" name="__module.model.model.layers.18.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3267"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2516" name="Constant_18305" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="3268"> <dim>1</dim> </port> </output> </layer> <layer id="2517" name="__module.model.model.layers.18.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3269,variance.73"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2518" name="Constant_90215_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2519" name="Constant_90215" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2520" name="__module.model.model.layers.18.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3270"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2521" name="__module.model.model.layers.18.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2522" name="__module.model.model.layers.18.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3271"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2523" name="__module.model.model.layers.18.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3272,3273,hidden_states.435,hidden_states.437"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2524" name="__module.model.model.layers.18.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3274,3276,hidden_states.439"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2525" name="self.model.model.layers.18.self_attn.qkv_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="9216, 3072" offset="4077097300" size="56623104" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.18.self_attn.qkv_proj.weight"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2526" name="self.model.model.layers.18.self_attn.qkv_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2527" name="__module.model.model.layers.18.self_attn.qkv_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3283,qkv.37"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> </output> </layer> <layer id="2528" name="Constant_18348" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2529" name="Constant_18350" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2530" name="Constant_18352" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2531" name="__module.model.model.layers.18.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3284,query_states.37"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2532" name="Constant_96660" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2533" name="__module.model.model.layers.18.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3288"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="2534" name="__module.model.model.layers.18.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2535" name="__module.model.model.layers.18.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3289,q.37"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2536" name="__module.model.model.layers.18.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="3338"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2537" name="Constant_18915" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2538" name="Constant_18917" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2539" name="Constant_18919" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2540" name="__module.model.model.layers.18.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3348,x2.73"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="2541" name="Constant_90218_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2542" name="Constant_90218" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2543" name="__module.model.model.layers.18.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3349"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="2544" name="Constant_18812" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2545" name="Constant_18856" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2546" name="Constant_18858" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2547" name="__module.model.model.layers.18.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3343"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="2548" name="__module.model.model.layers.18.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="3351"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2549" name="__module.model.model.layers.18.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="3352"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2550" name="__module.model.model.layers.18.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="3353"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2551" name="Constant_102650_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="2552" name="Constant_102650" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="2553" name="Constant_102643" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2554" name="Constant_102645" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2555" name="Constant_102647" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2556" name="Concat_102648" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2557" name="Broadcast_102651" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="2558" name="ReadValue_101087" type="ReadValue" version="opset6"> <data variable_id="past_key_values.18.keypresent.18.key" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.18.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2559" name="Constant_99959" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="2560" name="Gather_99960" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2561" name="Constant_18358" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2562" name="Constant_18360" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2563" name="Constant_18362" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2564" name="__module.model.model.layers.18.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3285,key_states.77"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2565" name="Constant_96661" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2566" name="__module.model.model.layers.18.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3291"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="2567" name="__module.model.model.layers.18.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2568" name="__module.model.model.layers.18.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3292,key_states.79"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2569" name="__module.model.model.layers.18.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="3354"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2570" name="Constant_19058" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2571" name="Constant_19060" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2572" name="Constant_19062" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2573" name="__module.model.model.layers.18.self_attn/aten::slice/Slice_4" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3364,x2.75"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="2574" name="Constant_90219_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2575" name="Constant_90219" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2576" name="__module.model.model.layers.18.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3365"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="2577" name="Constant_18955" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2578" name="Constant_18999" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2579" name="Constant_19001" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2580" name="__module.model.model.layers.18.self_attn/aten::slice/Slice_5" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3359"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="2581" name="__module.model.model.layers.18.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="3367"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2582" name="__module.model.model.layers.18.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="3368"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2583" name="__module.model.model.layers.18.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="3369"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2584" name="__module.model.model.layers.18.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.441,present.18.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2585" name="Constant_102638_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="2586" name="Constant_102638" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="2587" name="Constant_102631" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2588" name="Constant_102633" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2589" name="Constant_102635" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2590" name="Concat_102636" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2591" name="Broadcast_102639" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="2592" name="ReadValue_101089" type="ReadValue" version="opset6"> <data variable_id="past_key_values.18.valuepresent.18.value" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.18.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2593" name="Constant_99962" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="2594" name="Gather_99963" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2595" name="Constant_18368" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2596" name="Constant_18370" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2597" name="Constant_18372" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2598" name="__module.model.model.layers.18.self_attn/aten::slice/Slice_6" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3286,value_states.37"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2599" name="Constant_96662" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2600" name="__module.model.model.layers.18.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3294"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="2601" name="__module.model.model.layers.18.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2602" name="__module.model.model.layers.18.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3295"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2603" name="__module.model.model.layers.18.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.443,present.18.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2604" name="__module.model.model.layers.18.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="3379,attn_output.73"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2605" name="__module.model.model.layers.18.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2606" name="__module.model.model.layers.18.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3380"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="2607" name="Constant_96663" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="56635704" size="24" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="2608" name="__module.model.model.layers.18.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="3383"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2609" name="self.model.model.layers.18.self_attn.o_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 3072" offset="4133720404" size="18874368" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.18.self_attn.o_proj.weight"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2610" name="self.model.model.layers.18.self_attn.o_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2611" name="__module.model.model.layers.18.self_attn.o_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3385,3387,input.109"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2612" name="__module.model.model.layers.18/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3391,3393,3404,hidden_states.445,hidden_states.447"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2613" name="Constant_90223_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="4152594772" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2614" name="Constant_90223" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2615" name="Constant_90222_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2616" name="Constant_90222" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2617" name="Constant_90220_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2618" name="Constant_90220" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2619" name="__module.model.model.layers.18.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3394"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2620" name="Constant_19230" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="3395"> <dim>1</dim> </port> </output> </layer> <layer id="2621" name="__module.model.model.layers.18.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3396,variance.75"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2622" name="Constant_90221_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2623" name="Constant_90221" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2624" name="__module.model.model.layers.18.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3397"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2625" name="__module.model.model.layers.18.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2626" name="__module.model.model.layers.18.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3398"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2627" name="__module.model.model.layers.18.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3399,3400,hidden_states.449,hidden_states.451"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2628" name="__module.model.model.layers.18.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3401,3403"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2629" name="self.model.model.layers.18.mlp.gate_up_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="16384, 3072" offset="4152600916" size="100663296" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.18.mlp.gate_up_proj.weight"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2630" name="self.model.model.layers.18.mlp.gate_up_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2631" name="__module.model.model.layers.18.mlp.gate_up_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3408,up_states.73"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> </output> </layer> <layer id="2632" name="__module.model.model.layers.18.mlp/prim::ListUnpack/VariadicSplit" type="VariadicSplit" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> <port id="1" precision="I64" /> <port id="2" precision="I32"> <dim>2</dim> </port> </input> <output> <port id="3" precision="FP32" names="3410,input.111"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="4" precision="FP32" names="3411,up_states.75"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="2633" name="__module.model.model.layers.18.mlp.activation_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32" names="3412"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="2634" name="__module.model.model.layers.18.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="3413"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="2635" name="self.model.model.layers.18.mlp.down_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 8192" offset="4253264212" size="50331648" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.18.mlp.down_proj.weight"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="2636" name="self.model.model.layers.18.mlp.down_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="2637" name="__module.model.model.layers.18.mlp.down_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="3415,input.113"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2638" name="__module.model.model.layers.18/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3417,3419,3427,3438,hidden_states.455,hidden_states.457"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2639" name="Constant_90227_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="4303595860" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2640" name="Constant_90227" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2641" name="Constant_90226_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2642" name="Constant_90226" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2643" name="Constant_90224_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2644" name="Constant_90224" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2645" name="__module.model.model.layers.19.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3428"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2646" name="Constant_19299" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="3429"> <dim>1</dim> </port> </output> </layer> <layer id="2647" name="__module.model.model.layers.19.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3430,variance.77"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2648" name="Constant_90225_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2649" name="Constant_90225" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2650" name="__module.model.model.layers.19.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3431"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2651" name="__module.model.model.layers.19.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2652" name="__module.model.model.layers.19.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3432"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2653" name="__module.model.model.layers.19.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3433,3434,hidden_states.459,hidden_states.461"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2654" name="__module.model.model.layers.19.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3435,3437,hidden_states.463"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2655" name="self.model.model.layers.19.self_attn.qkv_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="9216, 3072" offset="4303602004" size="56623104" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.19.self_attn.qkv_proj.weight"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2656" name="self.model.model.layers.19.self_attn.qkv_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2657" name="__module.model.model.layers.19.self_attn.qkv_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3444,qkv.39"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> </output> </layer> <layer id="2658" name="Constant_19342" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2659" name="Constant_19344" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2660" name="Constant_19346" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2661" name="__module.model.model.layers.19.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3445,query_states.39"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2662" name="Constant_96664" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2663" name="__module.model.model.layers.19.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3449"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="2664" name="__module.model.model.layers.19.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2665" name="__module.model.model.layers.19.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3450,q.39"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2666" name="__module.model.model.layers.19.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="3499"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2667" name="Constant_19909" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2668" name="Constant_19911" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2669" name="Constant_19913" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2670" name="__module.model.model.layers.19.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3509,x2.77"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="2671" name="Constant_90228_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2672" name="Constant_90228" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2673" name="__module.model.model.layers.19.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3510"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="2674" name="Constant_19806" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2675" name="Constant_19850" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2676" name="Constant_19852" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2677" name="__module.model.model.layers.19.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3504"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="2678" name="__module.model.model.layers.19.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="3512"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2679" name="__module.model.model.layers.19.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="3513"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2680" name="__module.model.model.layers.19.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="3514"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2681" name="Constant_102674_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="2682" name="Constant_102674" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="2683" name="Constant_102667" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2684" name="Constant_102669" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2685" name="Constant_102671" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2686" name="Concat_102672" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2687" name="Broadcast_102675" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="2688" name="ReadValue_101091" type="ReadValue" version="opset6"> <data variable_id="past_key_values.19.keypresent.19.key" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.19.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2689" name="Constant_99965" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="2690" name="Gather_99966" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2691" name="Constant_19352" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2692" name="Constant_19354" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2693" name="Constant_19356" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2694" name="__module.model.model.layers.19.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3446,key_states.81"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2695" name="Constant_96665" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2696" name="__module.model.model.layers.19.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3452"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="2697" name="__module.model.model.layers.19.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2698" name="__module.model.model.layers.19.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3453,key_states.83"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2699" name="__module.model.model.layers.19.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="3515"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2700" name="Constant_20052" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2701" name="Constant_20054" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2702" name="Constant_20056" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2703" name="__module.model.model.layers.19.self_attn/aten::slice/Slice_4" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3525,x2.79"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="2704" name="Constant_90229_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2705" name="Constant_90229" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2706" name="__module.model.model.layers.19.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3526"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="2707" name="Constant_19949" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2708" name="Constant_19993" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2709" name="Constant_19995" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2710" name="__module.model.model.layers.19.self_attn/aten::slice/Slice_5" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3520"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="2711" name="__module.model.model.layers.19.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="3528"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2712" name="__module.model.model.layers.19.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="3529"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2713" name="__module.model.model.layers.19.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="3530"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2714" name="__module.model.model.layers.19.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.465,present.19.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2715" name="Constant_102662_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="2716" name="Constant_102662" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="2717" name="Constant_102655" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2718" name="Constant_102657" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2719" name="Constant_102659" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2720" name="Concat_102660" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2721" name="Broadcast_102663" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="2722" name="ReadValue_101093" type="ReadValue" version="opset6"> <data variable_id="past_key_values.19.valuepresent.19.value" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.19.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2723" name="Constant_99968" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="2724" name="Gather_99969" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2725" name="Constant_19362" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2726" name="Constant_19364" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2727" name="Constant_19366" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2728" name="__module.model.model.layers.19.self_attn/aten::slice/Slice_6" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3447,value_states.39"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2729" name="Constant_96666" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2730" name="__module.model.model.layers.19.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3455"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="2731" name="__module.model.model.layers.19.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2732" name="__module.model.model.layers.19.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3456"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2733" name="__module.model.model.layers.19.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.467,present.19.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2734" name="__module.model.model.layers.19.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="3540,attn_output.77"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2735" name="__module.model.model.layers.19.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2736" name="__module.model.model.layers.19.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3541"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="2737" name="Constant_96667" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="56635704" size="24" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="2738" name="__module.model.model.layers.19.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="3544"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2739" name="self.model.model.layers.19.self_attn.o_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 3072" offset="4360225108" size="18874368" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.19.self_attn.o_proj.weight"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2740" name="self.model.model.layers.19.self_attn.o_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2741" name="__module.model.model.layers.19.self_attn.o_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3546,3548,input.115"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2742" name="__module.model.model.layers.19/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3552,3554,3565,hidden_states.469,hidden_states.471"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2743" name="Constant_90233_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="4379099476" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2744" name="Constant_90233" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2745" name="Constant_90232_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2746" name="Constant_90232" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2747" name="Constant_90230_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2748" name="Constant_90230" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2749" name="__module.model.model.layers.19.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3555"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2750" name="Constant_20224" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="3556"> <dim>1</dim> </port> </output> </layer> <layer id="2751" name="__module.model.model.layers.19.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3557,variance.79"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2752" name="Constant_90231_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2753" name="Constant_90231" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2754" name="__module.model.model.layers.19.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3558"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2755" name="__module.model.model.layers.19.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2756" name="__module.model.model.layers.19.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3559"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2757" name="__module.model.model.layers.19.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3560,3561,hidden_states.473,hidden_states.475"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2758" name="__module.model.model.layers.19.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3562,3564"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2759" name="self.model.model.layers.19.mlp.gate_up_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="16384, 3072" offset="4379105620" size="100663296" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.19.mlp.gate_up_proj.weight"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2760" name="self.model.model.layers.19.mlp.gate_up_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2761" name="__module.model.model.layers.19.mlp.gate_up_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3569,up_states.77"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> </output> </layer> <layer id="2762" name="__module.model.model.layers.19.mlp/prim::ListUnpack/VariadicSplit" type="VariadicSplit" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> <port id="1" precision="I64" /> <port id="2" precision="I32"> <dim>2</dim> </port> </input> <output> <port id="3" precision="FP32" names="3571,input.117"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="4" precision="FP32" names="3572,up_states.79"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="2763" name="__module.model.model.layers.19.mlp.activation_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32" names="3573"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="2764" name="__module.model.model.layers.19.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="3574"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="2765" name="self.model.model.layers.19.mlp.down_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 8192" offset="4479768916" size="50331648" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.19.mlp.down_proj.weight"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="2766" name="self.model.model.layers.19.mlp.down_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="2767" name="__module.model.model.layers.19.mlp.down_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="3576,input.119"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2768" name="__module.model.model.layers.19/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3578,3580,3588,3599,hidden_states.479,hidden_states.481"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2769" name="Constant_90237_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="4530100564" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2770" name="Constant_90237" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2771" name="Constant_90236_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2772" name="Constant_90236" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2773" name="Constant_90234_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2774" name="Constant_90234" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2775" name="__module.model.model.layers.20.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3589"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2776" name="Constant_20293" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="3590"> <dim>1</dim> </port> </output> </layer> <layer id="2777" name="__module.model.model.layers.20.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3591,variance.81"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2778" name="Constant_90235_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2779" name="Constant_90235" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2780" name="__module.model.model.layers.20.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3592"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2781" name="__module.model.model.layers.20.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2782" name="__module.model.model.layers.20.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3593"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2783" name="__module.model.model.layers.20.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3594,3595,hidden_states.483,hidden_states.485"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2784" name="__module.model.model.layers.20.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3596,3598,hidden_states.487"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2785" name="self.model.model.layers.20.self_attn.qkv_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="9216, 3072" offset="4530106708" size="56623104" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.20.self_attn.qkv_proj.weight"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2786" name="self.model.model.layers.20.self_attn.qkv_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2787" name="__module.model.model.layers.20.self_attn.qkv_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3605,qkv.41"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> </output> </layer> <layer id="2788" name="Constant_20336" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2789" name="Constant_20338" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2790" name="Constant_20340" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2791" name="__module.model.model.layers.20.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3606,query_states.41"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2792" name="Constant_96668" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2793" name="__module.model.model.layers.20.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3610"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="2794" name="__module.model.model.layers.20.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2795" name="__module.model.model.layers.20.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3611,q.41"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2796" name="__module.model.model.layers.20.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="3660"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2797" name="Constant_20903" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2798" name="Constant_20905" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2799" name="Constant_20907" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2800" name="__module.model.model.layers.20.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3670,x2.81"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="2801" name="Constant_90238_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2802" name="Constant_90238" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2803" name="__module.model.model.layers.20.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3671"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="2804" name="Constant_20800" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2805" name="Constant_20844" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2806" name="Constant_20846" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2807" name="__module.model.model.layers.20.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3665"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="2808" name="__module.model.model.layers.20.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="3673"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2809" name="__module.model.model.layers.20.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="3674"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2810" name="__module.model.model.layers.20.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="3675"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2811" name="Constant_102698_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="2812" name="Constant_102698" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="2813" name="Constant_102691" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2814" name="Constant_102693" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2815" name="Constant_102695" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2816" name="Concat_102696" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2817" name="Broadcast_102699" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="2818" name="ReadValue_101099" type="ReadValue" version="opset6"> <data variable_id="past_key_values.20.keypresent.20.key" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.20.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2819" name="Constant_99971" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="2820" name="Gather_99972" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2821" name="Constant_20346" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2822" name="Constant_20348" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2823" name="Constant_20350" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2824" name="__module.model.model.layers.20.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3607,key_states.85"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2825" name="Constant_96669" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2826" name="__module.model.model.layers.20.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3613"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="2827" name="__module.model.model.layers.20.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2828" name="__module.model.model.layers.20.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3614,key_states.87"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2829" name="__module.model.model.layers.20.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="3676"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2830" name="Constant_21046" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2831" name="Constant_21048" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2832" name="Constant_21050" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2833" name="__module.model.model.layers.20.self_attn/aten::slice/Slice_4" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3686,x2.83"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="2834" name="Constant_90239_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2835" name="Constant_90239" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2836" name="__module.model.model.layers.20.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3687"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="2837" name="Constant_20943" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2838" name="Constant_20987" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2839" name="Constant_20989" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2840" name="__module.model.model.layers.20.self_attn/aten::slice/Slice_5" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3681"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="2841" name="__module.model.model.layers.20.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="3689"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2842" name="__module.model.model.layers.20.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="3690"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2843" name="__module.model.model.layers.20.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="3691"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2844" name="__module.model.model.layers.20.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.489,present.20.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2845" name="Constant_102686_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="2846" name="Constant_102686" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="2847" name="Constant_102679" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2848" name="Constant_102681" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2849" name="Constant_102683" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2850" name="Concat_102684" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2851" name="Broadcast_102687" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="2852" name="ReadValue_101101" type="ReadValue" version="opset6"> <data variable_id="past_key_values.20.valuepresent.20.value" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.20.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2853" name="Constant_99974" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="2854" name="Gather_99975" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2855" name="Constant_20356" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2856" name="Constant_20358" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2857" name="Constant_20360" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2858" name="__module.model.model.layers.20.self_attn/aten::slice/Slice_6" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3608,value_states.41"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2859" name="Constant_96670" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2860" name="__module.model.model.layers.20.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3616"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="2861" name="__module.model.model.layers.20.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2862" name="__module.model.model.layers.20.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3617"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2863" name="__module.model.model.layers.20.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.491,present.20.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2864" name="__module.model.model.layers.20.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="3701,attn_output.81"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2865" name="__module.model.model.layers.20.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2866" name="__module.model.model.layers.20.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3702"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="2867" name="Constant_96671" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="56635704" size="24" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="2868" name="__module.model.model.layers.20.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="3705"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2869" name="self.model.model.layers.20.self_attn.o_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 3072" offset="4586729812" size="18874368" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.20.self_attn.o_proj.weight"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2870" name="self.model.model.layers.20.self_attn.o_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2871" name="__module.model.model.layers.20.self_attn.o_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3707,3709,input.121"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2872" name="__module.model.model.layers.20/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3713,3715,3726,hidden_states.493,hidden_states.495"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2873" name="Constant_90243_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="4605604180" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2874" name="Constant_90243" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2875" name="Constant_90242_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2876" name="Constant_90242" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2877" name="Constant_90240_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2878" name="Constant_90240" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2879" name="__module.model.model.layers.20.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3716"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2880" name="Constant_21218" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="3717"> <dim>1</dim> </port> </output> </layer> <layer id="2881" name="__module.model.model.layers.20.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3718,variance.83"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2882" name="Constant_90241_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2883" name="Constant_90241" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2884" name="__module.model.model.layers.20.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3719"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2885" name="__module.model.model.layers.20.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2886" name="__module.model.model.layers.20.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3720"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2887" name="__module.model.model.layers.20.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3721,3722,hidden_states.497,hidden_states.499"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2888" name="__module.model.model.layers.20.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3723,3725"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2889" name="self.model.model.layers.20.mlp.gate_up_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="16384, 3072" offset="4605610324" size="100663296" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.20.mlp.gate_up_proj.weight"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2890" name="self.model.model.layers.20.mlp.gate_up_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2891" name="__module.model.model.layers.20.mlp.gate_up_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3730,up_states.81"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> </output> </layer> <layer id="2892" name="__module.model.model.layers.20.mlp/prim::ListUnpack/VariadicSplit" type="VariadicSplit" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> <port id="1" precision="I64" /> <port id="2" precision="I32"> <dim>2</dim> </port> </input> <output> <port id="3" precision="FP32" names="3732,input.123"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="4" precision="FP32" names="3733,up_states.83"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="2893" name="__module.model.model.layers.20.mlp.activation_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32" names="3734"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="2894" name="__module.model.model.layers.20.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="3735"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="2895" name="self.model.model.layers.20.mlp.down_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 8192" offset="4706273620" size="50331648" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.20.mlp.down_proj.weight"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="2896" name="self.model.model.layers.20.mlp.down_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="2897" name="__module.model.model.layers.20.mlp.down_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="3737,input.125"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2898" name="__module.model.model.layers.20/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3739,3741,3749,3760,hidden_states.503,hidden_states.505"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2899" name="Constant_90247_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="4756605268" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2900" name="Constant_90247" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2901" name="Constant_90246_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2902" name="Constant_90246" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2903" name="Constant_90244_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2904" name="Constant_90244" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2905" name="__module.model.model.layers.21.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3750"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2906" name="Constant_21287" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="3751"> <dim>1</dim> </port> </output> </layer> <layer id="2907" name="__module.model.model.layers.21.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3752,variance.85"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2908" name="Constant_90245_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2909" name="Constant_90245" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2910" name="__module.model.model.layers.21.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3753"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2911" name="__module.model.model.layers.21.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2912" name="__module.model.model.layers.21.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3754"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2913" name="__module.model.model.layers.21.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3755,3756,hidden_states.507,hidden_states.509"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2914" name="__module.model.model.layers.21.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3757,3759,hidden_states.511"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2915" name="self.model.model.layers.21.self_attn.qkv_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="9216, 3072" offset="4756611412" size="56623104" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.21.self_attn.qkv_proj.weight"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2916" name="self.model.model.layers.21.self_attn.qkv_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2917" name="__module.model.model.layers.21.self_attn.qkv_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3766,qkv.43"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> </output> </layer> <layer id="2918" name="Constant_21330" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2919" name="Constant_21332" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2920" name="Constant_21334" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2921" name="__module.model.model.layers.21.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3767,query_states.43"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2922" name="Constant_96672" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2923" name="__module.model.model.layers.21.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3771"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="2924" name="__module.model.model.layers.21.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2925" name="__module.model.model.layers.21.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3772,q.43"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2926" name="__module.model.model.layers.21.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="3821"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2927" name="Constant_21897" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2928" name="Constant_21899" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2929" name="Constant_21901" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2930" name="__module.model.model.layers.21.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3831,x2.85"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="2931" name="Constant_90248_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2932" name="Constant_90248" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2933" name="__module.model.model.layers.21.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3832"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="2934" name="Constant_21794" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2935" name="Constant_21838" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2936" name="Constant_21840" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2937" name="__module.model.model.layers.21.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3826"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="2938" name="__module.model.model.layers.21.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="3834"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2939" name="__module.model.model.layers.21.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="3835"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2940" name="__module.model.model.layers.21.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="3836"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2941" name="Constant_102722_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="2942" name="Constant_102722" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="2943" name="Constant_102715" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2944" name="Constant_102717" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2945" name="Constant_102719" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2946" name="Concat_102720" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2947" name="Broadcast_102723" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="2948" name="ReadValue_101103" type="ReadValue" version="opset6"> <data variable_id="past_key_values.21.keypresent.21.key" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.21.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2949" name="Constant_99977" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="2950" name="Gather_99978" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2951" name="Constant_21340" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2952" name="Constant_21342" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2953" name="Constant_21344" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2954" name="__module.model.model.layers.21.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3768,key_states.89"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2955" name="Constant_96673" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2956" name="__module.model.model.layers.21.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3774"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="2957" name="__module.model.model.layers.21.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2958" name="__module.model.model.layers.21.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3775,key_states.91"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2959" name="__module.model.model.layers.21.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="3837"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2960" name="Constant_22040" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2961" name="Constant_22042" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2962" name="Constant_22044" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2963" name="__module.model.model.layers.21.self_attn/aten::slice/Slice_4" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3847,x2.87"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="2964" name="Constant_90249_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2965" name="Constant_90249" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="2966" name="__module.model.model.layers.21.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3848"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="2967" name="Constant_21937" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2968" name="Constant_21981" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2969" name="Constant_21983" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2970" name="__module.model.model.layers.21.self_attn/aten::slice/Slice_5" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3842"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="2971" name="__module.model.model.layers.21.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="3850"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2972" name="__module.model.model.layers.21.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="3851"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2973" name="__module.model.model.layers.21.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="3852"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2974" name="__module.model.model.layers.21.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.513,present.21.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2975" name="Constant_102710_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="2976" name="Constant_102710" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="2977" name="Constant_102703" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2978" name="Constant_102705" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2979" name="Constant_102707" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2980" name="Concat_102708" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2981" name="Broadcast_102711" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="2982" name="ReadValue_101105" type="ReadValue" version="opset6"> <data variable_id="past_key_values.21.valuepresent.21.value" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.21.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2983" name="Constant_99980" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="2984" name="Gather_99981" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2985" name="Constant_21350" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2986" name="Constant_21352" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2987" name="Constant_21354" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="2988" name="__module.model.model.layers.21.self_attn/aten::slice/Slice_6" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3769,value_states.43"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2989" name="Constant_96674" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="2990" name="__module.model.model.layers.21.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3777"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="2991" name="__module.model.model.layers.21.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2992" name="__module.model.model.layers.21.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3778"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2993" name="__module.model.model.layers.21.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.515,present.21.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2994" name="__module.model.model.layers.21.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="3862,attn_output.85"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="2995" name="__module.model.model.layers.21.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="2996" name="__module.model.model.layers.21.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3863"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="2997" name="Constant_96675" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="56635704" size="24" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="2998" name="__module.model.model.layers.21.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="3866"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="2999" name="self.model.model.layers.21.self_attn.o_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 3072" offset="4813234516" size="18874368" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.21.self_attn.o_proj.weight"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3000" name="self.model.model.layers.21.self_attn.o_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3001" name="__module.model.model.layers.21.self_attn.o_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3868,3870,input.127"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3002" name="__module.model.model.layers.21/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3874,3876,3887,hidden_states.517,hidden_states.519"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3003" name="Constant_90253_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="4832108884" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3004" name="Constant_90253" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3005" name="Constant_90252_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3006" name="Constant_90252" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3007" name="Constant_90250_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3008" name="Constant_90250" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3009" name="__module.model.model.layers.21.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3877"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3010" name="Constant_22212" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="3878"> <dim>1</dim> </port> </output> </layer> <layer id="3011" name="__module.model.model.layers.21.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3879,variance.87"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3012" name="Constant_90251_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3013" name="Constant_90251" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3014" name="__module.model.model.layers.21.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3880"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3015" name="__module.model.model.layers.21.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3016" name="__module.model.model.layers.21.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3881"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3017" name="__module.model.model.layers.21.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3882,3883,hidden_states.521,hidden_states.523"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3018" name="__module.model.model.layers.21.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3884,3886"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3019" name="self.model.model.layers.21.mlp.gate_up_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="16384, 3072" offset="4832115028" size="100663296" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.21.mlp.gate_up_proj.weight"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3020" name="self.model.model.layers.21.mlp.gate_up_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3021" name="__module.model.model.layers.21.mlp.gate_up_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3891,up_states.85"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> </output> </layer> <layer id="3022" name="__module.model.model.layers.21.mlp/prim::ListUnpack/VariadicSplit" type="VariadicSplit" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> <port id="1" precision="I64" /> <port id="2" precision="I32"> <dim>2</dim> </port> </input> <output> <port id="3" precision="FP32" names="3893,input.129"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="4" precision="FP32" names="3894,up_states.87"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="3023" name="__module.model.model.layers.21.mlp.activation_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32" names="3895"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="3024" name="__module.model.model.layers.21.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="3896"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="3025" name="self.model.model.layers.21.mlp.down_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 8192" offset="4932778324" size="50331648" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.21.mlp.down_proj.weight"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="3026" name="self.model.model.layers.21.mlp.down_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="3027" name="__module.model.model.layers.21.mlp.down_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="3898,input.131"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3028" name="__module.model.model.layers.21/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3900,3902,3910,3921,hidden_states.527,hidden_states.529"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3029" name="Constant_90257_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="4983109972" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3030" name="Constant_90257" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3031" name="Constant_90256_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3032" name="Constant_90256" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3033" name="Constant_90254_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3034" name="Constant_90254" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3035" name="__module.model.model.layers.22.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3911"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3036" name="Constant_22281" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="3912"> <dim>1</dim> </port> </output> </layer> <layer id="3037" name="__module.model.model.layers.22.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3913,variance.89"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3038" name="Constant_90255_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3039" name="Constant_90255" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3040" name="__module.model.model.layers.22.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3914"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3041" name="__module.model.model.layers.22.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3042" name="__module.model.model.layers.22.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3915"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3043" name="__module.model.model.layers.22.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3916,3917,hidden_states.531,hidden_states.533"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3044" name="__module.model.model.layers.22.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3918,3920,hidden_states.535"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3045" name="self.model.model.layers.22.self_attn.qkv_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="9216, 3072" offset="4983116116" size="56623104" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.22.self_attn.qkv_proj.weight"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3046" name="self.model.model.layers.22.self_attn.qkv_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3047" name="__module.model.model.layers.22.self_attn.qkv_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="3927,qkv.45"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> </output> </layer> <layer id="3048" name="Constant_22324" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3049" name="Constant_22326" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3050" name="Constant_22328" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3051" name="__module.model.model.layers.22.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3928,query_states.45"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3052" name="Constant_96676" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3053" name="__module.model.model.layers.22.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3932"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="3054" name="__module.model.model.layers.22.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3055" name="__module.model.model.layers.22.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3933,q.45"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3056" name="__module.model.model.layers.22.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="3982"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3057" name="Constant_22891" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3058" name="Constant_22893" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3059" name="Constant_22895" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3060" name="__module.model.model.layers.22.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3992,x2.89"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="3061" name="Constant_90258_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3062" name="Constant_90258" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3063" name="__module.model.model.layers.22.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="3993"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="3064" name="Constant_22788" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3065" name="Constant_22832" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3066" name="Constant_22834" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3067" name="__module.model.model.layers.22.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3987"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="3068" name="__module.model.model.layers.22.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="3995"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3069" name="__module.model.model.layers.22.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="3996"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3070" name="__module.model.model.layers.22.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="3997"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3071" name="Constant_102746_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="3072" name="Constant_102746" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="3073" name="Constant_102739" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3074" name="Constant_102741" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3075" name="Constant_102743" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3076" name="Concat_102744" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3077" name="Broadcast_102747" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="3078" name="ReadValue_101107" type="ReadValue" version="opset6"> <data variable_id="past_key_values.22.keypresent.22.key" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.22.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3079" name="Constant_99983" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="3080" name="Gather_99984" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3081" name="Constant_22334" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3082" name="Constant_22336" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3083" name="Constant_22338" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3084" name="__module.model.model.layers.22.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3929,key_states.93"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3085" name="Constant_96677" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3086" name="__module.model.model.layers.22.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3935"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="3087" name="__module.model.model.layers.22.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3088" name="__module.model.model.layers.22.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3936,key_states.95"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3089" name="__module.model.model.layers.22.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="3998"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3090" name="Constant_23034" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3091" name="Constant_23036" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3092" name="Constant_23038" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3093" name="__module.model.model.layers.22.self_attn/aten::slice/Slice_4" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4008,x2.91"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="3094" name="Constant_90259_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3095" name="Constant_90259" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3096" name="__module.model.model.layers.22.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4009"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="3097" name="Constant_22931" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3098" name="Constant_22975" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3099" name="Constant_22977" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3100" name="__module.model.model.layers.22.self_attn/aten::slice/Slice_5" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4003"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="3101" name="__module.model.model.layers.22.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="4011"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3102" name="__module.model.model.layers.22.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="4012"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3103" name="__module.model.model.layers.22.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="4013"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3104" name="__module.model.model.layers.22.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.537,present.22.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3105" name="Constant_102734_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="3106" name="Constant_102734" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="3107" name="Constant_102727" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3108" name="Constant_102729" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3109" name="Constant_102731" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3110" name="Concat_102732" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3111" name="Broadcast_102735" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="3112" name="ReadValue_101109" type="ReadValue" version="opset6"> <data variable_id="past_key_values.22.valuepresent.22.value" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.22.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3113" name="Constant_99986" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="3114" name="Gather_99987" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3115" name="Constant_22344" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3116" name="Constant_22346" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3117" name="Constant_22348" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3118" name="__module.model.model.layers.22.self_attn/aten::slice/Slice_6" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="3930,value_states.45"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3119" name="Constant_96678" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3120" name="__module.model.model.layers.22.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3938"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="3121" name="__module.model.model.layers.22.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3122" name="__module.model.model.layers.22.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="3939"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3123" name="__module.model.model.layers.22.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.539,present.22.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3124" name="__module.model.model.layers.22.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="4023,attn_output.89"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3125" name="__module.model.model.layers.22.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3126" name="__module.model.model.layers.22.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4024"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="3127" name="Constant_96679" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="56635704" size="24" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="3128" name="__module.model.model.layers.22.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="4027"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3129" name="self.model.model.layers.22.self_attn.o_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 3072" offset="5039739220" size="18874368" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.22.self_attn.o_proj.weight"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3130" name="self.model.model.layers.22.self_attn.o_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3131" name="__module.model.model.layers.22.self_attn.o_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4029,4031,input.133"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3132" name="__module.model.model.layers.22/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4035,4037,4048,hidden_states.541,hidden_states.543"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3133" name="Constant_90263_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="5058613588" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3134" name="Constant_90263" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3135" name="Constant_90262_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3136" name="Constant_90262" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3137" name="Constant_90260_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3138" name="Constant_90260" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3139" name="__module.model.model.layers.22.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4038"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3140" name="Constant_23206" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="4039"> <dim>1</dim> </port> </output> </layer> <layer id="3141" name="__module.model.model.layers.22.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4040,variance.91"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3142" name="Constant_90261_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3143" name="Constant_90261" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3144" name="__module.model.model.layers.22.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4041"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3145" name="__module.model.model.layers.22.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3146" name="__module.model.model.layers.22.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4042"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3147" name="__module.model.model.layers.22.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4043,4044,hidden_states.545,hidden_states.547"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3148" name="__module.model.model.layers.22.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4045,4047"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3149" name="self.model.model.layers.22.mlp.gate_up_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="16384, 3072" offset="5058619732" size="100663296" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.22.mlp.gate_up_proj.weight"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3150" name="self.model.model.layers.22.mlp.gate_up_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3151" name="__module.model.model.layers.22.mlp.gate_up_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4052,up_states.89"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> </output> </layer> <layer id="3152" name="__module.model.model.layers.22.mlp/prim::ListUnpack/VariadicSplit" type="VariadicSplit" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> <port id="1" precision="I64" /> <port id="2" precision="I32"> <dim>2</dim> </port> </input> <output> <port id="3" precision="FP32" names="4054,input.135"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="4" precision="FP32" names="4055,up_states.91"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="3153" name="__module.model.model.layers.22.mlp.activation_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32" names="4056"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="3154" name="__module.model.model.layers.22.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="4057"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="3155" name="self.model.model.layers.22.mlp.down_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 8192" offset="5159283028" size="50331648" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.22.mlp.down_proj.weight"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="3156" name="self.model.model.layers.22.mlp.down_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="3157" name="__module.model.model.layers.22.mlp.down_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="4059,input.137"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3158" name="__module.model.model.layers.22/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4061,4063,4071,4082,hidden_states.551,hidden_states.553"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3159" name="Constant_90267_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="5209614676" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3160" name="Constant_90267" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3161" name="Constant_90266_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3162" name="Constant_90266" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3163" name="Constant_90264_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3164" name="Constant_90264" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3165" name="__module.model.model.layers.23.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4072"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3166" name="Constant_23275" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="4073"> <dim>1</dim> </port> </output> </layer> <layer id="3167" name="__module.model.model.layers.23.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4074,variance.93"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3168" name="Constant_90265_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3169" name="Constant_90265" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3170" name="__module.model.model.layers.23.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4075"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3171" name="__module.model.model.layers.23.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3172" name="__module.model.model.layers.23.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4076"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3173" name="__module.model.model.layers.23.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4077,4078,hidden_states.555,hidden_states.557"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3174" name="__module.model.model.layers.23.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4079,4081,hidden_states.559"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3175" name="self.model.model.layers.23.self_attn.qkv_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="9216, 3072" offset="5209620820" size="56623104" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.23.self_attn.qkv_proj.weight"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3176" name="self.model.model.layers.23.self_attn.qkv_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3177" name="__module.model.model.layers.23.self_attn.qkv_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4088,qkv.47"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> </output> </layer> <layer id="3178" name="Constant_23318" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3179" name="Constant_23320" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3180" name="Constant_23322" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3181" name="__module.model.model.layers.23.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4089,query_states.47"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3182" name="Constant_96680" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3183" name="__module.model.model.layers.23.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4093"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="3184" name="__module.model.model.layers.23.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3185" name="__module.model.model.layers.23.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4094,q.47"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3186" name="__module.model.model.layers.23.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="4143"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3187" name="Constant_23885" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3188" name="Constant_23887" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3189" name="Constant_23889" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3190" name="__module.model.model.layers.23.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4153,x2.93"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="3191" name="Constant_90268_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3192" name="Constant_90268" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3193" name="__module.model.model.layers.23.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4154"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="3194" name="Constant_23782" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3195" name="Constant_23826" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3196" name="Constant_23828" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3197" name="__module.model.model.layers.23.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4148"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="3198" name="__module.model.model.layers.23.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="4156"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3199" name="__module.model.model.layers.23.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="4157"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3200" name="__module.model.model.layers.23.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="4158"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3201" name="Constant_102770_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="3202" name="Constant_102770" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="3203" name="Constant_102763" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3204" name="Constant_102765" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3205" name="Constant_102767" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3206" name="Concat_102768" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3207" name="Broadcast_102771" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="3208" name="ReadValue_101111" type="ReadValue" version="opset6"> <data variable_id="past_key_values.23.keypresent.23.key" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.23.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3209" name="Constant_99989" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="3210" name="Gather_99990" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3211" name="Constant_23328" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3212" name="Constant_23330" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3213" name="Constant_23332" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3214" name="__module.model.model.layers.23.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4090,key_states.97"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3215" name="Constant_96681" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3216" name="__module.model.model.layers.23.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4096"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="3217" name="__module.model.model.layers.23.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3218" name="__module.model.model.layers.23.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4097,key_states.99"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3219" name="__module.model.model.layers.23.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="4159"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3220" name="Constant_24028" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3221" name="Constant_24030" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3222" name="Constant_24032" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3223" name="__module.model.model.layers.23.self_attn/aten::slice/Slice_4" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4169,x2.95"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="3224" name="Constant_90269_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3225" name="Constant_90269" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3226" name="__module.model.model.layers.23.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4170"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="3227" name="Constant_23925" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3228" name="Constant_23969" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3229" name="Constant_23971" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3230" name="__module.model.model.layers.23.self_attn/aten::slice/Slice_5" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4164"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="3231" name="__module.model.model.layers.23.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="4172"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3232" name="__module.model.model.layers.23.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="4173"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3233" name="__module.model.model.layers.23.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="4174"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3234" name="__module.model.model.layers.23.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.561,present.23.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3235" name="Constant_102758_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="3236" name="Constant_102758" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="3237" name="Constant_102751" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3238" name="Constant_102753" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3239" name="Constant_102755" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3240" name="Concat_102756" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3241" name="Broadcast_102759" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="3242" name="ReadValue_101113" type="ReadValue" version="opset6"> <data variable_id="past_key_values.23.valuepresent.23.value" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.23.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3243" name="Constant_99992" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="3244" name="Gather_99993" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3245" name="Constant_23338" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3246" name="Constant_23340" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3247" name="Constant_23342" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3248" name="__module.model.model.layers.23.self_attn/aten::slice/Slice_6" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4091,value_states.47"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3249" name="Constant_96682" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3250" name="__module.model.model.layers.23.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4099"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="3251" name="__module.model.model.layers.23.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3252" name="__module.model.model.layers.23.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4100"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3253" name="__module.model.model.layers.23.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.563,present.23.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3254" name="__module.model.model.layers.23.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="4184,attn_output.93"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3255" name="__module.model.model.layers.23.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3256" name="__module.model.model.layers.23.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4185"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="3257" name="Constant_96683" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="56635704" size="24" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="3258" name="__module.model.model.layers.23.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="4188"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3259" name="self.model.model.layers.23.self_attn.o_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 3072" offset="5266243924" size="18874368" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.23.self_attn.o_proj.weight"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3260" name="self.model.model.layers.23.self_attn.o_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3261" name="__module.model.model.layers.23.self_attn.o_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4190,4192,input.139"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3262" name="__module.model.model.layers.23/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4196,4198,4209,hidden_states.565,hidden_states.567"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3263" name="Constant_90273_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="5285118292" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3264" name="Constant_90273" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3265" name="Constant_90272_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3266" name="Constant_90272" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3267" name="Constant_90270_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3268" name="Constant_90270" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3269" name="__module.model.model.layers.23.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4199"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3270" name="Constant_24200" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="4200"> <dim>1</dim> </port> </output> </layer> <layer id="3271" name="__module.model.model.layers.23.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4201,variance.95"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3272" name="Constant_90271_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3273" name="Constant_90271" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3274" name="__module.model.model.layers.23.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4202"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3275" name="__module.model.model.layers.23.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3276" name="__module.model.model.layers.23.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4203"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3277" name="__module.model.model.layers.23.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4204,4205,hidden_states.569,hidden_states.571"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3278" name="__module.model.model.layers.23.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4206,4208"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3279" name="self.model.model.layers.23.mlp.gate_up_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="16384, 3072" offset="5285124436" size="100663296" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.23.mlp.gate_up_proj.weight"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3280" name="self.model.model.layers.23.mlp.gate_up_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3281" name="__module.model.model.layers.23.mlp.gate_up_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4213,up_states.93"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> </output> </layer> <layer id="3282" name="__module.model.model.layers.23.mlp/prim::ListUnpack/VariadicSplit" type="VariadicSplit" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> <port id="1" precision="I64" /> <port id="2" precision="I32"> <dim>2</dim> </port> </input> <output> <port id="3" precision="FP32" names="4215,input.141"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="4" precision="FP32" names="4216,up_states.95"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="3283" name="__module.model.model.layers.23.mlp.activation_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32" names="4217"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="3284" name="__module.model.model.layers.23.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="4218"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="3285" name="self.model.model.layers.23.mlp.down_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 8192" offset="5385787732" size="50331648" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.23.mlp.down_proj.weight"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="3286" name="self.model.model.layers.23.mlp.down_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="3287" name="__module.model.model.layers.23.mlp.down_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="4220,input.143"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3288" name="__module.model.model.layers.23/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4222,4224,4232,4243,hidden_states.575,hidden_states.577"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3289" name="Constant_90277_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="5436119380" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3290" name="Constant_90277" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3291" name="Constant_90276_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3292" name="Constant_90276" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3293" name="Constant_90274_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3294" name="Constant_90274" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3295" name="__module.model.model.layers.24.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4233"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3296" name="Constant_24269" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="4234"> <dim>1</dim> </port> </output> </layer> <layer id="3297" name="__module.model.model.layers.24.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4235,variance.97"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3298" name="Constant_90275_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3299" name="Constant_90275" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3300" name="__module.model.model.layers.24.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4236"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3301" name="__module.model.model.layers.24.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3302" name="__module.model.model.layers.24.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4237"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3303" name="__module.model.model.layers.24.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4238,4239,hidden_states.579,hidden_states.581"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3304" name="__module.model.model.layers.24.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4240,4242,hidden_states.583"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3305" name="self.model.model.layers.24.self_attn.qkv_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="9216, 3072" offset="5436125524" size="56623104" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.24.self_attn.qkv_proj.weight"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3306" name="self.model.model.layers.24.self_attn.qkv_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3307" name="__module.model.model.layers.24.self_attn.qkv_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4249,qkv.49"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> </output> </layer> <layer id="3308" name="Constant_24312" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3309" name="Constant_24314" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3310" name="Constant_24316" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3311" name="__module.model.model.layers.24.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4250,query_states.49"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3312" name="Constant_96684" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3313" name="__module.model.model.layers.24.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4254"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="3314" name="__module.model.model.layers.24.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3315" name="__module.model.model.layers.24.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4255,q.49"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3316" name="__module.model.model.layers.24.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="4304"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3317" name="Constant_24879" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3318" name="Constant_24881" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3319" name="Constant_24883" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3320" name="__module.model.model.layers.24.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4314,x2.97"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="3321" name="Constant_90278_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3322" name="Constant_90278" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3323" name="__module.model.model.layers.24.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4315"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="3324" name="Constant_24776" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3325" name="Constant_24820" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3326" name="Constant_24822" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3327" name="__module.model.model.layers.24.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4309"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="3328" name="__module.model.model.layers.24.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="4317"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3329" name="__module.model.model.layers.24.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="4318"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3330" name="__module.model.model.layers.24.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="4319"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3331" name="Constant_102794_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="3332" name="Constant_102794" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="3333" name="Constant_102787" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3334" name="Constant_102789" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3335" name="Constant_102791" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3336" name="Concat_102792" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3337" name="Broadcast_102795" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="3338" name="ReadValue_101115" type="ReadValue" version="opset6"> <data variable_id="past_key_values.24.keypresent.24.key" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.24.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3339" name="Constant_99995" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="3340" name="Gather_99996" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3341" name="Constant_24322" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3342" name="Constant_24324" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3343" name="Constant_24326" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3344" name="__module.model.model.layers.24.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4251,key_states.101"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3345" name="Constant_96685" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3346" name="__module.model.model.layers.24.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4257"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="3347" name="__module.model.model.layers.24.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3348" name="__module.model.model.layers.24.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4258,key_states.103"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3349" name="__module.model.model.layers.24.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="4320"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3350" name="Constant_25022" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3351" name="Constant_25024" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3352" name="Constant_25026" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3353" name="__module.model.model.layers.24.self_attn/aten::slice/Slice_4" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4330,x2.99"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="3354" name="Constant_90279_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3355" name="Constant_90279" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3356" name="__module.model.model.layers.24.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4331"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="3357" name="Constant_24919" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3358" name="Constant_24963" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3359" name="Constant_24965" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3360" name="__module.model.model.layers.24.self_attn/aten::slice/Slice_5" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4325"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="3361" name="__module.model.model.layers.24.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="4333"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3362" name="__module.model.model.layers.24.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="4334"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3363" name="__module.model.model.layers.24.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="4335"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3364" name="__module.model.model.layers.24.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.585,present.24.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3365" name="Constant_102782_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="3366" name="Constant_102782" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="3367" name="Constant_102775" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3368" name="Constant_102777" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3369" name="Constant_102779" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3370" name="Concat_102780" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3371" name="Broadcast_102783" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="3372" name="ReadValue_101117" type="ReadValue" version="opset6"> <data variable_id="past_key_values.24.valuepresent.24.value" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.24.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3373" name="Constant_99998" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="3374" name="Gather_99999" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3375" name="Constant_24332" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3376" name="Constant_24334" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3377" name="Constant_24336" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3378" name="__module.model.model.layers.24.self_attn/aten::slice/Slice_6" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4252,value_states.49"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3379" name="Constant_96686" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3380" name="__module.model.model.layers.24.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4260"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="3381" name="__module.model.model.layers.24.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3382" name="__module.model.model.layers.24.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4261"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3383" name="__module.model.model.layers.24.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.587,present.24.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3384" name="__module.model.model.layers.24.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="4345,attn_output.97"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3385" name="__module.model.model.layers.24.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3386" name="__module.model.model.layers.24.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4346"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="3387" name="Constant_96687" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="56635704" size="24" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="3388" name="__module.model.model.layers.24.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="4349"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3389" name="self.model.model.layers.24.self_attn.o_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 3072" offset="5492748628" size="18874368" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.24.self_attn.o_proj.weight"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3390" name="self.model.model.layers.24.self_attn.o_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3391" name="__module.model.model.layers.24.self_attn.o_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4351,4353,input.145"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3392" name="__module.model.model.layers.24/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4357,4359,4370,hidden_states.589,hidden_states.591"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3393" name="Constant_90283_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="5511622996" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3394" name="Constant_90283" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3395" name="Constant_90282_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3396" name="Constant_90282" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3397" name="Constant_90280_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3398" name="Constant_90280" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3399" name="__module.model.model.layers.24.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4360"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3400" name="Constant_25194" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="4361"> <dim>1</dim> </port> </output> </layer> <layer id="3401" name="__module.model.model.layers.24.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4362,variance.99"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3402" name="Constant_90281_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3403" name="Constant_90281" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3404" name="__module.model.model.layers.24.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4363"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3405" name="__module.model.model.layers.24.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3406" name="__module.model.model.layers.24.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4364"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3407" name="__module.model.model.layers.24.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4365,4366,hidden_states.593,hidden_states.595"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3408" name="__module.model.model.layers.24.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4367,4369"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3409" name="self.model.model.layers.24.mlp.gate_up_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="16384, 3072" offset="5511629140" size="100663296" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.24.mlp.gate_up_proj.weight"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3410" name="self.model.model.layers.24.mlp.gate_up_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3411" name="__module.model.model.layers.24.mlp.gate_up_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4374,up_states.97"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> </output> </layer> <layer id="3412" name="__module.model.model.layers.24.mlp/prim::ListUnpack/VariadicSplit" type="VariadicSplit" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> <port id="1" precision="I64" /> <port id="2" precision="I32"> <dim>2</dim> </port> </input> <output> <port id="3" precision="FP32" names="4376,input.147"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="4" precision="FP32" names="4377,up_states.99"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="3413" name="__module.model.model.layers.24.mlp.activation_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32" names="4378"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="3414" name="__module.model.model.layers.24.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="4379"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="3415" name="self.model.model.layers.24.mlp.down_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 8192" offset="5612292436" size="50331648" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.24.mlp.down_proj.weight"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="3416" name="self.model.model.layers.24.mlp.down_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="3417" name="__module.model.model.layers.24.mlp.down_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="4381,input.149"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3418" name="__module.model.model.layers.24/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4383,4385,4393,4404,hidden_states.599,hidden_states.601"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3419" name="Constant_90287_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="5662624084" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3420" name="Constant_90287" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3421" name="Constant_90286_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3422" name="Constant_90286" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3423" name="Constant_90284_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3424" name="Constant_90284" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3425" name="__module.model.model.layers.25.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4394"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3426" name="Constant_25263" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="4395"> <dim>1</dim> </port> </output> </layer> <layer id="3427" name="__module.model.model.layers.25.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4396,variance.101"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3428" name="Constant_90285_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3429" name="Constant_90285" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3430" name="__module.model.model.layers.25.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4397"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3431" name="__module.model.model.layers.25.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3432" name="__module.model.model.layers.25.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4398"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3433" name="__module.model.model.layers.25.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4399,4400,hidden_states.603,hidden_states.605"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3434" name="__module.model.model.layers.25.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4401,4403,hidden_states.607"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3435" name="self.model.model.layers.25.self_attn.qkv_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="9216, 3072" offset="5662630228" size="56623104" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.25.self_attn.qkv_proj.weight"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3436" name="self.model.model.layers.25.self_attn.qkv_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3437" name="__module.model.model.layers.25.self_attn.qkv_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4410,qkv.51"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> </output> </layer> <layer id="3438" name="Constant_25306" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3439" name="Constant_25308" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3440" name="Constant_25310" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3441" name="__module.model.model.layers.25.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4411,query_states.51"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3442" name="Constant_96688" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3443" name="__module.model.model.layers.25.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4415"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="3444" name="__module.model.model.layers.25.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3445" name="__module.model.model.layers.25.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4416,q.51"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3446" name="__module.model.model.layers.25.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="4465"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3447" name="Constant_25873" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3448" name="Constant_25875" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3449" name="Constant_25877" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3450" name="__module.model.model.layers.25.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4475,x2.101"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="3451" name="Constant_90288_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3452" name="Constant_90288" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3453" name="__module.model.model.layers.25.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4476"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="3454" name="Constant_25770" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3455" name="Constant_25814" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3456" name="Constant_25816" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3457" name="__module.model.model.layers.25.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4470"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="3458" name="__module.model.model.layers.25.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="4478"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3459" name="__module.model.model.layers.25.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="4479"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3460" name="__module.model.model.layers.25.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="4480"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3461" name="Constant_102818_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="3462" name="Constant_102818" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="3463" name="Constant_102811" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3464" name="Constant_102813" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3465" name="Constant_102815" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3466" name="Concat_102816" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3467" name="Broadcast_102819" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="3468" name="ReadValue_101119" type="ReadValue" version="opset6"> <data variable_id="past_key_values.25.keypresent.25.key" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.25.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3469" name="Constant_100001" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="3470" name="Gather_100002" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3471" name="Constant_25316" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3472" name="Constant_25318" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3473" name="Constant_25320" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3474" name="__module.model.model.layers.25.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4412,key_states.105"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3475" name="Constant_96689" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3476" name="__module.model.model.layers.25.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4418"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="3477" name="__module.model.model.layers.25.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3478" name="__module.model.model.layers.25.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4419,key_states.107"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3479" name="__module.model.model.layers.25.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="4481"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3480" name="Constant_26016" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3481" name="Constant_26018" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3482" name="Constant_26020" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3483" name="__module.model.model.layers.25.self_attn/aten::slice/Slice_4" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4491,x2.103"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="3484" name="Constant_90289_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3485" name="Constant_90289" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3486" name="__module.model.model.layers.25.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4492"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="3487" name="Constant_25913" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3488" name="Constant_25957" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3489" name="Constant_25959" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3490" name="__module.model.model.layers.25.self_attn/aten::slice/Slice_5" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4486"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="3491" name="__module.model.model.layers.25.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="4494"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3492" name="__module.model.model.layers.25.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="4495"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3493" name="__module.model.model.layers.25.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="4496"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3494" name="__module.model.model.layers.25.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.609,present.25.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3495" name="Constant_102806_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="3496" name="Constant_102806" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="3497" name="Constant_102799" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3498" name="Constant_102801" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3499" name="Constant_102803" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3500" name="Concat_102804" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3501" name="Broadcast_102807" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="3502" name="ReadValue_101121" type="ReadValue" version="opset6"> <data variable_id="past_key_values.25.valuepresent.25.value" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.25.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3503" name="Constant_100004" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="3504" name="Gather_100005" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3505" name="Constant_25326" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3506" name="Constant_25328" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3507" name="Constant_25330" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3508" name="__module.model.model.layers.25.self_attn/aten::slice/Slice_6" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4413,value_states.51"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3509" name="Constant_96690" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3510" name="__module.model.model.layers.25.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4421"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="3511" name="__module.model.model.layers.25.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3512" name="__module.model.model.layers.25.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4422"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3513" name="__module.model.model.layers.25.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.611,present.25.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3514" name="__module.model.model.layers.25.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="4506,attn_output.101"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3515" name="__module.model.model.layers.25.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3516" name="__module.model.model.layers.25.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4507"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="3517" name="Constant_96691" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="56635704" size="24" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="3518" name="__module.model.model.layers.25.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="4510"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3519" name="self.model.model.layers.25.self_attn.o_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 3072" offset="5719253332" size="18874368" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.25.self_attn.o_proj.weight"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3520" name="self.model.model.layers.25.self_attn.o_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3521" name="__module.model.model.layers.25.self_attn.o_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4512,4514,input.151"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3522" name="__module.model.model.layers.25/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4518,4520,4531,hidden_states.613,hidden_states.615"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3523" name="Constant_90293_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="5738127700" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3524" name="Constant_90293" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3525" name="Constant_90292_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3526" name="Constant_90292" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3527" name="Constant_90290_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3528" name="Constant_90290" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3529" name="__module.model.model.layers.25.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4521"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3530" name="Constant_26188" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="4522"> <dim>1</dim> </port> </output> </layer> <layer id="3531" name="__module.model.model.layers.25.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4523,variance.103"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3532" name="Constant_90291_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3533" name="Constant_90291" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3534" name="__module.model.model.layers.25.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4524"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3535" name="__module.model.model.layers.25.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3536" name="__module.model.model.layers.25.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4525"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3537" name="__module.model.model.layers.25.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4526,4527,hidden_states.617,hidden_states.619"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3538" name="__module.model.model.layers.25.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4528,4530"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3539" name="self.model.model.layers.25.mlp.gate_up_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="16384, 3072" offset="5738133844" size="100663296" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.25.mlp.gate_up_proj.weight"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3540" name="self.model.model.layers.25.mlp.gate_up_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3541" name="__module.model.model.layers.25.mlp.gate_up_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4535,up_states.101"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> </output> </layer> <layer id="3542" name="__module.model.model.layers.25.mlp/prim::ListUnpack/VariadicSplit" type="VariadicSplit" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> <port id="1" precision="I64" /> <port id="2" precision="I32"> <dim>2</dim> </port> </input> <output> <port id="3" precision="FP32" names="4537,input.153"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="4" precision="FP32" names="4538,up_states.103"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="3543" name="__module.model.model.layers.25.mlp.activation_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32" names="4539"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="3544" name="__module.model.model.layers.25.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="4540"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="3545" name="self.model.model.layers.25.mlp.down_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 8192" offset="5838797140" size="50331648" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.25.mlp.down_proj.weight"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="3546" name="self.model.model.layers.25.mlp.down_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="3547" name="__module.model.model.layers.25.mlp.down_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="4542,input.155"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3548" name="__module.model.model.layers.25/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4544,4546,4554,4565,hidden_states.623,hidden_states.625"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3549" name="Constant_90297_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="5889128788" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3550" name="Constant_90297" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3551" name="Constant_90296_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3552" name="Constant_90296" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3553" name="Constant_90294_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3554" name="Constant_90294" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3555" name="__module.model.model.layers.26.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4555"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3556" name="Constant_26257" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="4556"> <dim>1</dim> </port> </output> </layer> <layer id="3557" name="__module.model.model.layers.26.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4557,variance.105"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3558" name="Constant_90295_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3559" name="Constant_90295" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3560" name="__module.model.model.layers.26.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4558"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3561" name="__module.model.model.layers.26.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3562" name="__module.model.model.layers.26.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4559"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3563" name="__module.model.model.layers.26.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4560,4561,hidden_states.627,hidden_states.629"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3564" name="__module.model.model.layers.26.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4562,4564,hidden_states.631"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3565" name="self.model.model.layers.26.self_attn.qkv_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="9216, 3072" offset="5889134932" size="56623104" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.26.self_attn.qkv_proj.weight"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3566" name="self.model.model.layers.26.self_attn.qkv_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3567" name="__module.model.model.layers.26.self_attn.qkv_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4571,qkv.53"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> </output> </layer> <layer id="3568" name="Constant_26300" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3569" name="Constant_26302" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3570" name="Constant_26304" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3571" name="__module.model.model.layers.26.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4572,query_states.53"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3572" name="Constant_96692" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3573" name="__module.model.model.layers.26.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4576"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="3574" name="__module.model.model.layers.26.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3575" name="__module.model.model.layers.26.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4577,q.53"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3576" name="__module.model.model.layers.26.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="4626"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3577" name="Constant_26867" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3578" name="Constant_26869" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3579" name="Constant_26871" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3580" name="__module.model.model.layers.26.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4636,x2.105"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="3581" name="Constant_90298_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3582" name="Constant_90298" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3583" name="__module.model.model.layers.26.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4637"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="3584" name="Constant_26764" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3585" name="Constant_26808" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3586" name="Constant_26810" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3587" name="__module.model.model.layers.26.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4631"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="3588" name="__module.model.model.layers.26.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="4639"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3589" name="__module.model.model.layers.26.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="4640"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3590" name="__module.model.model.layers.26.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="4641"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3591" name="Constant_102842_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="3592" name="Constant_102842" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="3593" name="Constant_102835" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3594" name="Constant_102837" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3595" name="Constant_102839" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3596" name="Concat_102840" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3597" name="Broadcast_102843" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="3598" name="ReadValue_101123" type="ReadValue" version="opset6"> <data variable_id="past_key_values.26.keypresent.26.key" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.26.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3599" name="Constant_100007" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="3600" name="Gather_100008" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3601" name="Constant_26310" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3602" name="Constant_26312" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3603" name="Constant_26314" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3604" name="__module.model.model.layers.26.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4573,key_states.109"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3605" name="Constant_96693" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3606" name="__module.model.model.layers.26.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4579"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="3607" name="__module.model.model.layers.26.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3608" name="__module.model.model.layers.26.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4580,key_states.111"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3609" name="__module.model.model.layers.26.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="4642"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3610" name="Constant_27010" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3611" name="Constant_27012" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3612" name="Constant_27014" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3613" name="__module.model.model.layers.26.self_attn/aten::slice/Slice_4" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4652,x2.107"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="3614" name="Constant_90299_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3615" name="Constant_90299" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3616" name="__module.model.model.layers.26.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4653"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="3617" name="Constant_26907" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3618" name="Constant_26951" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3619" name="Constant_26953" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3620" name="__module.model.model.layers.26.self_attn/aten::slice/Slice_5" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4647"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="3621" name="__module.model.model.layers.26.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="4655"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3622" name="__module.model.model.layers.26.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="4656"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3623" name="__module.model.model.layers.26.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="4657"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3624" name="__module.model.model.layers.26.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.633,present.26.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3625" name="Constant_102830_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="3626" name="Constant_102830" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="3627" name="Constant_102823" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3628" name="Constant_102825" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3629" name="Constant_102827" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3630" name="Concat_102828" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3631" name="Broadcast_102831" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="3632" name="ReadValue_101125" type="ReadValue" version="opset6"> <data variable_id="past_key_values.26.valuepresent.26.value" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.26.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3633" name="Constant_100010" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="3634" name="Gather_100011" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3635" name="Constant_26320" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3636" name="Constant_26322" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3637" name="Constant_26324" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3638" name="__module.model.model.layers.26.self_attn/aten::slice/Slice_6" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4574,value_states.53"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3639" name="Constant_96694" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3640" name="__module.model.model.layers.26.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4582"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="3641" name="__module.model.model.layers.26.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3642" name="__module.model.model.layers.26.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4583"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3643" name="__module.model.model.layers.26.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.635,present.26.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3644" name="__module.model.model.layers.26.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="4667,attn_output.105"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3645" name="__module.model.model.layers.26.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3646" name="__module.model.model.layers.26.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4668"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="3647" name="Constant_96695" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="56635704" size="24" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="3648" name="__module.model.model.layers.26.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="4671"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3649" name="self.model.model.layers.26.self_attn.o_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 3072" offset="5945758036" size="18874368" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.26.self_attn.o_proj.weight"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3650" name="self.model.model.layers.26.self_attn.o_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3651" name="__module.model.model.layers.26.self_attn.o_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4673,4675,input.157"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3652" name="__module.model.model.layers.26/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4679,4681,4692,hidden_states.637,hidden_states.639"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3653" name="Constant_90303_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="5964632404" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3654" name="Constant_90303" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3655" name="Constant_90302_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3656" name="Constant_90302" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3657" name="Constant_90300_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3658" name="Constant_90300" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3659" name="__module.model.model.layers.26.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4682"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3660" name="Constant_27182" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="4683"> <dim>1</dim> </port> </output> </layer> <layer id="3661" name="__module.model.model.layers.26.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4684,variance.107"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3662" name="Constant_90301_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3663" name="Constant_90301" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3664" name="__module.model.model.layers.26.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4685"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3665" name="__module.model.model.layers.26.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3666" name="__module.model.model.layers.26.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4686"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3667" name="__module.model.model.layers.26.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4687,4688,hidden_states.641,hidden_states.643"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3668" name="__module.model.model.layers.26.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4689,4691"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3669" name="self.model.model.layers.26.mlp.gate_up_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="16384, 3072" offset="5964638548" size="100663296" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.26.mlp.gate_up_proj.weight"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3670" name="self.model.model.layers.26.mlp.gate_up_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3671" name="__module.model.model.layers.26.mlp.gate_up_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4696,up_states.105"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> </output> </layer> <layer id="3672" name="__module.model.model.layers.26.mlp/prim::ListUnpack/VariadicSplit" type="VariadicSplit" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> <port id="1" precision="I64" /> <port id="2" precision="I32"> <dim>2</dim> </port> </input> <output> <port id="3" precision="FP32" names="4698,input.159"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="4" precision="FP32" names="4699,up_states.107"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="3673" name="__module.model.model.layers.26.mlp.activation_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32" names="4700"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="3674" name="__module.model.model.layers.26.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="4701"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="3675" name="self.model.model.layers.26.mlp.down_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 8192" offset="6065301844" size="50331648" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.26.mlp.down_proj.weight"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="3676" name="self.model.model.layers.26.mlp.down_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="3677" name="__module.model.model.layers.26.mlp.down_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="4703,input.161"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3678" name="__module.model.model.layers.26/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4705,4707,4715,4726,hidden_states.647,hidden_states.649"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3679" name="Constant_90307_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="6115633492" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3680" name="Constant_90307" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3681" name="Constant_90306_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3682" name="Constant_90306" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3683" name="Constant_90304_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3684" name="Constant_90304" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3685" name="__module.model.model.layers.27.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4716"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3686" name="Constant_27251" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="4717"> <dim>1</dim> </port> </output> </layer> <layer id="3687" name="__module.model.model.layers.27.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4718,variance.109"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3688" name="Constant_90305_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3689" name="Constant_90305" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3690" name="__module.model.model.layers.27.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4719"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3691" name="__module.model.model.layers.27.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3692" name="__module.model.model.layers.27.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4720"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3693" name="__module.model.model.layers.27.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4721,4722,hidden_states.651,hidden_states.653"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3694" name="__module.model.model.layers.27.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4723,4725,hidden_states.655"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3695" name="self.model.model.layers.27.self_attn.qkv_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="9216, 3072" offset="6115639636" size="56623104" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.27.self_attn.qkv_proj.weight"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3696" name="self.model.model.layers.27.self_attn.qkv_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3697" name="__module.model.model.layers.27.self_attn.qkv_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4732,qkv.55"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> </output> </layer> <layer id="3698" name="Constant_27294" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3699" name="Constant_27296" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3700" name="Constant_27298" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3701" name="__module.model.model.layers.27.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4733,query_states.55"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3702" name="Constant_96696" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3703" name="__module.model.model.layers.27.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4737"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="3704" name="__module.model.model.layers.27.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3705" name="__module.model.model.layers.27.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4738,q.55"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3706" name="__module.model.model.layers.27.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="4787"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3707" name="Constant_27861" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3708" name="Constant_27863" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3709" name="Constant_27865" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3710" name="__module.model.model.layers.27.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4797,x2.109"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="3711" name="Constant_90308_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3712" name="Constant_90308" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3713" name="__module.model.model.layers.27.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4798"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="3714" name="Constant_27758" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3715" name="Constant_27802" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3716" name="Constant_27804" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3717" name="__module.model.model.layers.27.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4792"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="3718" name="__module.model.model.layers.27.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="4800"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3719" name="__module.model.model.layers.27.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="4801"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3720" name="__module.model.model.layers.27.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="4802"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3721" name="Constant_102866_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="3722" name="Constant_102866" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="3723" name="Constant_102859" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3724" name="Constant_102861" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3725" name="Constant_102863" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3726" name="Concat_102864" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3727" name="Broadcast_102867" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="3728" name="ReadValue_101127" type="ReadValue" version="opset6"> <data variable_id="past_key_values.27.keypresent.27.key" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.27.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3729" name="Constant_100013" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="3730" name="Gather_100014" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3731" name="Constant_27304" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3732" name="Constant_27306" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3733" name="Constant_27308" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3734" name="__module.model.model.layers.27.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4734,key_states.113"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3735" name="Constant_96697" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3736" name="__module.model.model.layers.27.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4740"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="3737" name="__module.model.model.layers.27.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3738" name="__module.model.model.layers.27.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4741,key_states.115"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3739" name="__module.model.model.layers.27.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="4803"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3740" name="Constant_28004" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3741" name="Constant_28006" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3742" name="Constant_28008" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3743" name="__module.model.model.layers.27.self_attn/aten::slice/Slice_4" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4813,x2.111"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="3744" name="Constant_90309_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3745" name="Constant_90309" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3746" name="__module.model.model.layers.27.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4814"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="3747" name="Constant_27901" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3748" name="Constant_27945" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3749" name="Constant_27947" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3750" name="__module.model.model.layers.27.self_attn/aten::slice/Slice_5" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4808"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="3751" name="__module.model.model.layers.27.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="4816"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3752" name="__module.model.model.layers.27.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="4817"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3753" name="__module.model.model.layers.27.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="4818"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3754" name="__module.model.model.layers.27.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.657,present.27.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3755" name="Constant_102854_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="3756" name="Constant_102854" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="3757" name="Constant_102847" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3758" name="Constant_102849" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3759" name="Constant_102851" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3760" name="Concat_102852" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3761" name="Broadcast_102855" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="3762" name="ReadValue_101129" type="ReadValue" version="opset6"> <data variable_id="past_key_values.27.valuepresent.27.value" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.27.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3763" name="Constant_100016" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="3764" name="Gather_100017" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3765" name="Constant_27314" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3766" name="Constant_27316" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3767" name="Constant_27318" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3768" name="__module.model.model.layers.27.self_attn/aten::slice/Slice_6" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4735,value_states.55"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3769" name="Constant_96698" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3770" name="__module.model.model.layers.27.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4743"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="3771" name="__module.model.model.layers.27.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3772" name="__module.model.model.layers.27.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4744"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3773" name="__module.model.model.layers.27.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.659,present.27.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3774" name="__module.model.model.layers.27.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="4828,attn_output.109"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3775" name="__module.model.model.layers.27.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3776" name="__module.model.model.layers.27.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4829"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="3777" name="Constant_96699" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="56635704" size="24" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="3778" name="__module.model.model.layers.27.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="4832"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3779" name="self.model.model.layers.27.self_attn.o_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 3072" offset="6172262740" size="18874368" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.27.self_attn.o_proj.weight"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3780" name="self.model.model.layers.27.self_attn.o_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3781" name="__module.model.model.layers.27.self_attn.o_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4834,4836,input.163"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3782" name="__module.model.model.layers.27/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4840,4842,4853,hidden_states.661,hidden_states.663"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3783" name="Constant_90313_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="6191137108" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3784" name="Constant_90313" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3785" name="Constant_90312_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3786" name="Constant_90312" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3787" name="Constant_90310_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3788" name="Constant_90310" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3789" name="__module.model.model.layers.27.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4843"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3790" name="Constant_28176" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="4844"> <dim>1</dim> </port> </output> </layer> <layer id="3791" name="__module.model.model.layers.27.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4845,variance.111"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3792" name="Constant_90311_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3793" name="Constant_90311" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3794" name="__module.model.model.layers.27.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4846"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3795" name="__module.model.model.layers.27.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3796" name="__module.model.model.layers.27.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4847"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3797" name="__module.model.model.layers.27.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4848,4849,hidden_states.665,hidden_states.667"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3798" name="__module.model.model.layers.27.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4850,4852"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3799" name="self.model.model.layers.27.mlp.gate_up_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="16384, 3072" offset="6191143252" size="100663296" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.27.mlp.gate_up_proj.weight"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3800" name="self.model.model.layers.27.mlp.gate_up_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3801" name="__module.model.model.layers.27.mlp.gate_up_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4857,up_states.109"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> </output> </layer> <layer id="3802" name="__module.model.model.layers.27.mlp/prim::ListUnpack/VariadicSplit" type="VariadicSplit" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> <port id="1" precision="I64" /> <port id="2" precision="I32"> <dim>2</dim> </port> </input> <output> <port id="3" precision="FP32" names="4859,input.165"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="4" precision="FP32" names="4860,up_states.111"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="3803" name="__module.model.model.layers.27.mlp.activation_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32" names="4861"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="3804" name="__module.model.model.layers.27.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="4862"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="3805" name="self.model.model.layers.27.mlp.down_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 8192" offset="6291806548" size="50331648" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.27.mlp.down_proj.weight"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="3806" name="self.model.model.layers.27.mlp.down_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="3807" name="__module.model.model.layers.27.mlp.down_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="4864,input.167"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3808" name="__module.model.model.layers.27/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4866,4868,4876,4887,hidden_states.671,hidden_states.673"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3809" name="Constant_90317_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="6342138196" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3810" name="Constant_90317" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3811" name="Constant_90316_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3812" name="Constant_90316" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3813" name="Constant_90314_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3814" name="Constant_90314" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3815" name="__module.model.model.layers.28.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4877"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3816" name="Constant_28245" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="4878"> <dim>1</dim> </port> </output> </layer> <layer id="3817" name="__module.model.model.layers.28.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4879,variance.113"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3818" name="Constant_90315_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3819" name="Constant_90315" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3820" name="__module.model.model.layers.28.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4880"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3821" name="__module.model.model.layers.28.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3822" name="__module.model.model.layers.28.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4881"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3823" name="__module.model.model.layers.28.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4882,4883,hidden_states.675,hidden_states.677"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3824" name="__module.model.model.layers.28.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4884,4886,hidden_states.679"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3825" name="self.model.model.layers.28.self_attn.qkv_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="9216, 3072" offset="6342144340" size="56623104" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.28.self_attn.qkv_proj.weight"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3826" name="self.model.model.layers.28.self_attn.qkv_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3827" name="__module.model.model.layers.28.self_attn.qkv_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4893,qkv.57"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> </output> </layer> <layer id="3828" name="Constant_28288" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3829" name="Constant_28290" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3830" name="Constant_28292" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3831" name="__module.model.model.layers.28.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4894,query_states.57"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3832" name="Constant_96700" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3833" name="__module.model.model.layers.28.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4898"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="3834" name="__module.model.model.layers.28.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3835" name="__module.model.model.layers.28.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4899,q.57"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3836" name="__module.model.model.layers.28.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="4948"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3837" name="Constant_28855" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3838" name="Constant_28857" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3839" name="Constant_28859" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3840" name="__module.model.model.layers.28.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4958,x2.113"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="3841" name="Constant_90318_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3842" name="Constant_90318" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3843" name="__module.model.model.layers.28.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4959"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="3844" name="Constant_28752" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3845" name="Constant_28796" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3846" name="Constant_28798" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3847" name="__module.model.model.layers.28.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4953"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="3848" name="__module.model.model.layers.28.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="4961"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3849" name="__module.model.model.layers.28.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="4962"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3850" name="__module.model.model.layers.28.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="4963"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3851" name="Constant_102890_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="3852" name="Constant_102890" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="3853" name="Constant_102883" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3854" name="Constant_102885" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3855" name="Constant_102887" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3856" name="Concat_102888" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3857" name="Broadcast_102891" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="3858" name="ReadValue_101131" type="ReadValue" version="opset6"> <data variable_id="past_key_values.28.keypresent.28.key" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.28.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3859" name="Constant_100019" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="3860" name="Gather_100020" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3861" name="Constant_28298" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3862" name="Constant_28300" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3863" name="Constant_28302" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3864" name="__module.model.model.layers.28.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4895,key_states.117"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3865" name="Constant_96701" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3866" name="__module.model.model.layers.28.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4901"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="3867" name="__module.model.model.layers.28.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3868" name="__module.model.model.layers.28.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4902,key_states.119"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3869" name="__module.model.model.layers.28.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="4964"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3870" name="Constant_28998" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3871" name="Constant_29000" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3872" name="Constant_29002" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3873" name="__module.model.model.layers.28.self_attn/aten::slice/Slice_4" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4974,x2.115"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="3874" name="Constant_90319_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3875" name="Constant_90319" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3876" name="__module.model.model.layers.28.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="4975"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="3877" name="Constant_28895" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3878" name="Constant_28939" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3879" name="Constant_28941" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3880" name="__module.model.model.layers.28.self_attn/aten::slice/Slice_5" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4969"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="3881" name="__module.model.model.layers.28.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="4977"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3882" name="__module.model.model.layers.28.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="4978"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3883" name="__module.model.model.layers.28.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="4979"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3884" name="__module.model.model.layers.28.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.681,present.28.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3885" name="Constant_102878_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="3886" name="Constant_102878" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="3887" name="Constant_102871" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3888" name="Constant_102873" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3889" name="Constant_102875" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3890" name="Concat_102876" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3891" name="Broadcast_102879" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="3892" name="ReadValue_101133" type="ReadValue" version="opset6"> <data variable_id="past_key_values.28.valuepresent.28.value" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.28.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3893" name="Constant_100022" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="3894" name="Gather_100023" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3895" name="Constant_28308" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3896" name="Constant_28310" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3897" name="Constant_28312" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3898" name="__module.model.model.layers.28.self_attn/aten::slice/Slice_6" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="4896,value_states.57"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3899" name="Constant_96702" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3900" name="__module.model.model.layers.28.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4904"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="3901" name="__module.model.model.layers.28.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3902" name="__module.model.model.layers.28.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4905"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3903" name="__module.model.model.layers.28.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.683,present.28.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3904" name="__module.model.model.layers.28.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="4989,attn_output.113"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3905" name="__module.model.model.layers.28.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3906" name="__module.model.model.layers.28.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="4990"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="3907" name="Constant_96703" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="56635704" size="24" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="3908" name="__module.model.model.layers.28.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="4993"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3909" name="self.model.model.layers.28.self_attn.o_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 3072" offset="6398767444" size="18874368" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.28.self_attn.o_proj.weight"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3910" name="self.model.model.layers.28.self_attn.o_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3911" name="__module.model.model.layers.28.self_attn.o_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="4995,4997,input.169"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3912" name="__module.model.model.layers.28/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5001,5003,5014,hidden_states.685,hidden_states.687"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3913" name="Constant_90323_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="6417641812" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3914" name="Constant_90323" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3915" name="Constant_90322_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3916" name="Constant_90322" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3917" name="Constant_90320_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3918" name="Constant_90320" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3919" name="__module.model.model.layers.28.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5004"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3920" name="Constant_29170" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="5005"> <dim>1</dim> </port> </output> </layer> <layer id="3921" name="__module.model.model.layers.28.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5006,variance.115"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3922" name="Constant_90321_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3923" name="Constant_90321" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3924" name="__module.model.model.layers.28.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5007"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3925" name="__module.model.model.layers.28.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3926" name="__module.model.model.layers.28.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5008"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3927" name="__module.model.model.layers.28.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5009,5010,hidden_states.689,hidden_states.691"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3928" name="__module.model.model.layers.28.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5011,5013"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3929" name="self.model.model.layers.28.mlp.gate_up_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="16384, 3072" offset="6417647956" size="100663296" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.28.mlp.gate_up_proj.weight"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3930" name="self.model.model.layers.28.mlp.gate_up_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3931" name="__module.model.model.layers.28.mlp.gate_up_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5018,up_states.113"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> </output> </layer> <layer id="3932" name="__module.model.model.layers.28.mlp/prim::ListUnpack/VariadicSplit" type="VariadicSplit" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> <port id="1" precision="I64" /> <port id="2" precision="I32"> <dim>2</dim> </port> </input> <output> <port id="3" precision="FP32" names="5020,input.171"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="4" precision="FP32" names="5021,up_states.115"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="3933" name="__module.model.model.layers.28.mlp.activation_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32" names="5022"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="3934" name="__module.model.model.layers.28.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="5023"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="3935" name="self.model.model.layers.28.mlp.down_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 8192" offset="6518311252" size="50331648" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.28.mlp.down_proj.weight"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="3936" name="self.model.model.layers.28.mlp.down_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="3937" name="__module.model.model.layers.28.mlp.down_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="5025,input.173"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3938" name="__module.model.model.layers.28/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5027,5029,5037,5048,hidden_states.695,hidden_states.697"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3939" name="Constant_90327_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="6568642900" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3940" name="Constant_90327" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3941" name="Constant_90326_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3942" name="Constant_90326" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3943" name="Constant_90324_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3944" name="Constant_90324" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3945" name="__module.model.model.layers.29.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5038"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3946" name="Constant_29239" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="5039"> <dim>1</dim> </port> </output> </layer> <layer id="3947" name="__module.model.model.layers.29.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5040,variance.117"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3948" name="Constant_90325_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3949" name="Constant_90325" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3950" name="__module.model.model.layers.29.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5041"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3951" name="__module.model.model.layers.29.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3952" name="__module.model.model.layers.29.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5042"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3953" name="__module.model.model.layers.29.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5043,5044,hidden_states.699,hidden_states.701"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3954" name="__module.model.model.layers.29.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5045,5047,hidden_states.703"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3955" name="self.model.model.layers.29.self_attn.qkv_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="9216, 3072" offset="6568649044" size="56623104" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.29.self_attn.qkv_proj.weight"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3956" name="self.model.model.layers.29.self_attn.qkv_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3957" name="__module.model.model.layers.29.self_attn.qkv_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5054,qkv.59"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> </output> </layer> <layer id="3958" name="Constant_29282" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3959" name="Constant_29284" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3960" name="Constant_29286" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3961" name="__module.model.model.layers.29.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="5055,query_states.59"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3962" name="Constant_96704" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3963" name="__module.model.model.layers.29.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5059"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="3964" name="__module.model.model.layers.29.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3965" name="__module.model.model.layers.29.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5060,q.59"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3966" name="__module.model.model.layers.29.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="5109"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3967" name="Constant_29849" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3968" name="Constant_29851" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3969" name="Constant_29853" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3970" name="__module.model.model.layers.29.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="5119,x2.117"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="3971" name="Constant_90328_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3972" name="Constant_90328" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="3973" name="__module.model.model.layers.29.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5120"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="3974" name="Constant_29746" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3975" name="Constant_29790" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3976" name="Constant_29792" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3977" name="__module.model.model.layers.29.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="5114"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="3978" name="__module.model.model.layers.29.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="5122"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3979" name="__module.model.model.layers.29.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="5123"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3980" name="__module.model.model.layers.29.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="5124"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3981" name="Constant_102914_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="3982" name="Constant_102914" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="3983" name="Constant_102907" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3984" name="Constant_102909" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3985" name="Constant_102911" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3986" name="Concat_102912" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3987" name="Broadcast_102915" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="3988" name="ReadValue_101135" type="ReadValue" version="opset6"> <data variable_id="past_key_values.29.keypresent.29.key" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.29.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3989" name="Constant_100025" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="3990" name="Gather_100026" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3991" name="Constant_29292" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3992" name="Constant_29294" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3993" name="Constant_29296" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="3994" name="__module.model.model.layers.29.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="5056,key_states.121"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="3995" name="Constant_96705" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="3996" name="__module.model.model.layers.29.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5062"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="3997" name="__module.model.model.layers.29.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="3998" name="__module.model.model.layers.29.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5063,key_states.123"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="3999" name="__module.model.model.layers.29.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="5125"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4000" name="Constant_29992" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4001" name="Constant_29994" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4002" name="Constant_29996" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4003" name="__module.model.model.layers.29.self_attn/aten::slice/Slice_4" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="5135,x2.119"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="4004" name="Constant_90329_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4005" name="Constant_90329" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4006" name="__module.model.model.layers.29.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5136"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="4007" name="Constant_29889" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4008" name="Constant_29933" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4009" name="Constant_29935" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4010" name="__module.model.model.layers.29.self_attn/aten::slice/Slice_5" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="5130"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="4011" name="__module.model.model.layers.29.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="5138"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4012" name="__module.model.model.layers.29.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="5139"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4013" name="__module.model.model.layers.29.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="5140"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4014" name="__module.model.model.layers.29.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.705,present.29.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4015" name="Constant_102902_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="4016" name="Constant_102902" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="4017" name="Constant_102895" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4018" name="Constant_102897" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4019" name="Constant_102899" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4020" name="Concat_102900" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4021" name="Broadcast_102903" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="4022" name="ReadValue_101137" type="ReadValue" version="opset6"> <data variable_id="past_key_values.29.valuepresent.29.value" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.29.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4023" name="Constant_100028" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="4024" name="Gather_100029" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4025" name="Constant_29302" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4026" name="Constant_29304" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4027" name="Constant_29306" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4028" name="__module.model.model.layers.29.self_attn/aten::slice/Slice_6" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="5057,value_states.59"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4029" name="Constant_96706" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4030" name="__module.model.model.layers.29.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5065"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="4031" name="__module.model.model.layers.29.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4032" name="__module.model.model.layers.29.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5066"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4033" name="__module.model.model.layers.29.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.707,present.29.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4034" name="__module.model.model.layers.29.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="5150,attn_output.117"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4035" name="__module.model.model.layers.29.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4036" name="__module.model.model.layers.29.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5151"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="4037" name="Constant_96707" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="56635704" size="24" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="4038" name="__module.model.model.layers.29.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="5154"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4039" name="self.model.model.layers.29.self_attn.o_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 3072" offset="6625272148" size="18874368" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.29.self_attn.o_proj.weight"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4040" name="self.model.model.layers.29.self_attn.o_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4041" name="__module.model.model.layers.29.self_attn.o_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5156,5158,input.175"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4042" name="__module.model.model.layers.29/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5162,5164,5175,hidden_states.709,hidden_states.711"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4043" name="Constant_90333_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="6644146516" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4044" name="Constant_90333" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4045" name="Constant_90332_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4046" name="Constant_90332" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4047" name="Constant_90330_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4048" name="Constant_90330" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4049" name="__module.model.model.layers.29.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5165"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4050" name="Constant_30164" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="5166"> <dim>1</dim> </port> </output> </layer> <layer id="4051" name="__module.model.model.layers.29.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5167,variance.119"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4052" name="Constant_90331_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4053" name="Constant_90331" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4054" name="__module.model.model.layers.29.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5168"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4055" name="__module.model.model.layers.29.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4056" name="__module.model.model.layers.29.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5169"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4057" name="__module.model.model.layers.29.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5170,5171,hidden_states.713,hidden_states.715"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4058" name="__module.model.model.layers.29.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5172,5174"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4059" name="self.model.model.layers.29.mlp.gate_up_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="16384, 3072" offset="6644152660" size="100663296" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.29.mlp.gate_up_proj.weight"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4060" name="self.model.model.layers.29.mlp.gate_up_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4061" name="__module.model.model.layers.29.mlp.gate_up_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5179,up_states.117"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> </output> </layer> <layer id="4062" name="__module.model.model.layers.29.mlp/prim::ListUnpack/VariadicSplit" type="VariadicSplit" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> <port id="1" precision="I64" /> <port id="2" precision="I32"> <dim>2</dim> </port> </input> <output> <port id="3" precision="FP32" names="5181,input.177"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="4" precision="FP32" names="5182,up_states.119"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="4063" name="__module.model.model.layers.29.mlp.activation_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32" names="5183"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="4064" name="__module.model.model.layers.29.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="5184"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="4065" name="self.model.model.layers.29.mlp.down_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 8192" offset="6744815956" size="50331648" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.29.mlp.down_proj.weight"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="4066" name="self.model.model.layers.29.mlp.down_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="4067" name="__module.model.model.layers.29.mlp.down_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="5186,input.179"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4068" name="__module.model.model.layers.29/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5188,5190,5198,5209,hidden_states.719,hidden_states.721"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4069" name="Constant_90337_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="6795147604" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4070" name="Constant_90337" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4071" name="Constant_90336_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4072" name="Constant_90336" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4073" name="Constant_90334_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4074" name="Constant_90334" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4075" name="__module.model.model.layers.30.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5199"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4076" name="Constant_30233" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="5200"> <dim>1</dim> </port> </output> </layer> <layer id="4077" name="__module.model.model.layers.30.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5201,variance.121"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4078" name="Constant_90335_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4079" name="Constant_90335" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4080" name="__module.model.model.layers.30.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5202"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4081" name="__module.model.model.layers.30.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4082" name="__module.model.model.layers.30.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5203"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4083" name="__module.model.model.layers.30.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5204,5205,hidden_states.723,hidden_states.725"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4084" name="__module.model.model.layers.30.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5206,5208,hidden_states.727"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4085" name="self.model.model.layers.30.self_attn.qkv_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="9216, 3072" offset="6795153748" size="56623104" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.30.self_attn.qkv_proj.weight"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4086" name="self.model.model.layers.30.self_attn.qkv_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4087" name="__module.model.model.layers.30.self_attn.qkv_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5215,qkv.61"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> </output> </layer> <layer id="4088" name="Constant_30276" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4089" name="Constant_30278" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4090" name="Constant_30280" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4091" name="__module.model.model.layers.30.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="5216,query_states.61"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4092" name="Constant_96708" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4093" name="__module.model.model.layers.30.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5220"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="4094" name="__module.model.model.layers.30.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4095" name="__module.model.model.layers.30.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5221,q.61"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4096" name="__module.model.model.layers.30.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="5270"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4097" name="Constant_30843" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4098" name="Constant_30845" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4099" name="Constant_30847" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4100" name="__module.model.model.layers.30.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="5280,x2.121"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="4101" name="Constant_90338_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4102" name="Constant_90338" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4103" name="__module.model.model.layers.30.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5281"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="4104" name="Constant_30740" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4105" name="Constant_30784" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4106" name="Constant_30786" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4107" name="__module.model.model.layers.30.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="5275"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="4108" name="__module.model.model.layers.30.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="5283"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4109" name="__module.model.model.layers.30.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="5284"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4110" name="__module.model.model.layers.30.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="5285"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4111" name="Constant_102938_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="4112" name="Constant_102938" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="4113" name="Constant_102931" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4114" name="Constant_102933" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4115" name="Constant_102935" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4116" name="Concat_102936" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4117" name="Broadcast_102939" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="4118" name="ReadValue_101143" type="ReadValue" version="opset6"> <data variable_id="past_key_values.30.keypresent.30.key" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.30.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4119" name="Constant_100031" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="4120" name="Gather_100032" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4121" name="Constant_30286" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4122" name="Constant_30288" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4123" name="Constant_30290" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4124" name="__module.model.model.layers.30.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="5217,key_states.125"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4125" name="Constant_96709" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4126" name="__module.model.model.layers.30.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5223"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="4127" name="__module.model.model.layers.30.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4128" name="__module.model.model.layers.30.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5224,key_states.127"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4129" name="__module.model.model.layers.30.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="5286"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4130" name="Constant_30986" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4131" name="Constant_30988" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4132" name="Constant_30990" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4133" name="__module.model.model.layers.30.self_attn/aten::slice/Slice_4" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="5296,x2.123"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="4134" name="Constant_90339_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4135" name="Constant_90339" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4136" name="__module.model.model.layers.30.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5297"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="4137" name="Constant_30883" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4138" name="Constant_30927" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4139" name="Constant_30929" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4140" name="__module.model.model.layers.30.self_attn/aten::slice/Slice_5" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="5291"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="4141" name="__module.model.model.layers.30.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="5299"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4142" name="__module.model.model.layers.30.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="5300"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4143" name="__module.model.model.layers.30.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="5301"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4144" name="__module.model.model.layers.30.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.729,present.30.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4145" name="Constant_102926_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="4146" name="Constant_102926" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="4147" name="Constant_102919" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4148" name="Constant_102921" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4149" name="Constant_102923" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4150" name="Concat_102924" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4151" name="Broadcast_102927" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="4152" name="ReadValue_101145" type="ReadValue" version="opset6"> <data variable_id="past_key_values.30.valuepresent.30.value" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.30.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4153" name="Constant_100034" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="4154" name="Gather_100035" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4155" name="Constant_30296" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4156" name="Constant_30298" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4157" name="Constant_30300" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4158" name="__module.model.model.layers.30.self_attn/aten::slice/Slice_6" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="5218,value_states.61"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4159" name="Constant_96710" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4160" name="__module.model.model.layers.30.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5226"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="4161" name="__module.model.model.layers.30.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4162" name="__module.model.model.layers.30.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5227"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4163" name="__module.model.model.layers.30.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.731,present.30.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4164" name="__module.model.model.layers.30.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="5311,attn_output.121"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4165" name="__module.model.model.layers.30.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4166" name="__module.model.model.layers.30.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5312"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="4167" name="Constant_96711" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="56635704" size="24" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="4168" name="__module.model.model.layers.30.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="5315"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4169" name="self.model.model.layers.30.self_attn.o_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 3072" offset="6851776852" size="18874368" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.30.self_attn.o_proj.weight"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4170" name="self.model.model.layers.30.self_attn.o_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4171" name="__module.model.model.layers.30.self_attn.o_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5317,5319,input.181"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4172" name="__module.model.model.layers.30/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5323,5325,5336,hidden_states.733,hidden_states.735"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4173" name="Constant_90343_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="6870651220" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4174" name="Constant_90343" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4175" name="Constant_90342_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4176" name="Constant_90342" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4177" name="Constant_90340_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4178" name="Constant_90340" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4179" name="__module.model.model.layers.30.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5326"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4180" name="Constant_31158" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="5327"> <dim>1</dim> </port> </output> </layer> <layer id="4181" name="__module.model.model.layers.30.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5328,variance.123"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4182" name="Constant_90341_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4183" name="Constant_90341" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4184" name="__module.model.model.layers.30.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5329"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4185" name="__module.model.model.layers.30.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4186" name="__module.model.model.layers.30.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5330"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4187" name="__module.model.model.layers.30.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5331,5332,hidden_states.737,hidden_states.739"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4188" name="__module.model.model.layers.30.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5333,5335"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4189" name="self.model.model.layers.30.mlp.gate_up_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="16384, 3072" offset="6870657364" size="100663296" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.30.mlp.gate_up_proj.weight"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4190" name="self.model.model.layers.30.mlp.gate_up_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4191" name="__module.model.model.layers.30.mlp.gate_up_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5340,up_states.121"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> </output> </layer> <layer id="4192" name="__module.model.model.layers.30.mlp/prim::ListUnpack/VariadicSplit" type="VariadicSplit" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> <port id="1" precision="I64" /> <port id="2" precision="I32"> <dim>2</dim> </port> </input> <output> <port id="3" precision="FP32" names="5342,input.183"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="4" precision="FP32" names="5343,up_states.123"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="4193" name="__module.model.model.layers.30.mlp.activation_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32" names="5344"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="4194" name="__module.model.model.layers.30.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="5345"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="4195" name="self.model.model.layers.30.mlp.down_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 8192" offset="6971320660" size="50331648" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.30.mlp.down_proj.weight"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="4196" name="self.model.model.layers.30.mlp.down_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="4197" name="__module.model.model.layers.30.mlp.down_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="5347,input.185"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4198" name="__module.model.model.layers.30/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5349,5351,5359,5370,hidden_states.743,hidden_states.745"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4199" name="Constant_90346_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4200" name="Constant_90346" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4201" name="Constant_90344_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4202" name="Constant_90344" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4203" name="__module.model.model.layers.31.input_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5360"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4204" name="Constant_31227" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="5361"> <dim>1</dim> </port> </output> </layer> <layer id="4205" name="__module.model.model.layers.31.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5362,variance.125"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4206" name="Constant_90345_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4207" name="Constant_90345" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4208" name="__module.model.model.layers.31.input_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5363"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4209" name="__module.model.model.layers.31.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4210" name="__module.model.model.layers.31.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5364"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4211" name="__module.model.model.layers.31.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5365,5366,hidden_states.747,hidden_states.749"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4212" name="__module.model.model.layers.31.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5367,5369,hidden_states.751"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4213" name="self.model.model.layers.31.self_attn.qkv_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="9216, 3072" offset="7021652308" size="56623104" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.31.self_attn.qkv_proj.weight"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4214" name="self.model.model.layers.31.self_attn.qkv_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4215" name="__module.model.model.layers.31.self_attn.qkv_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>9216</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5376,qkv"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> </output> </layer> <layer id="4216" name="Constant_31290" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4217" name="Constant_31292" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4218" name="Constant_31294" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4219" name="__module.model.model.layers.31.self_attn/aten::slice/Slice" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="5379,value_states"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4220" name="Constant_96712" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4221" name="__module.model.model.layers.31.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5387"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="4222" name="__module.model.model.layers.31.self_attn/aten::transpose/Constant" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4223" name="__module.model.model.layers.31.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5388"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4224" name="__module.model.model.layers.31.self_attn/aten::cat/Concat" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.755,present.31.value"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4226" name="Constant_102950_compressed" type="Const" version="opset1"> <data element_type="f16" shape="" offset="0" size="2" /> <output> <port id="0" precision="FP16" /> </output> </layer> <layer id="4227" name="Constant_102950" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16" /> </input> <output> <port id="1" precision="FP32" /> </output> </layer> <layer id="4228" name="Constant_102943" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="10" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4229" name="Constant_102945" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4230" name="Constant_102947" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="18" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4231" name="Concat_102948" type="Concat" version="opset1"> <data axis="0" /> <input> <port id="0" precision="I64"> <dim>1</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="4" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4232" name="Broadcast_102951" type="Broadcast" version="opset3"> <data mode="numpy" /> <input> <port id="0" precision="FP32" /> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </output> </layer> <layer id="4233" name="ReadValue_101147" type="ReadValue" version="opset6"> <data variable_id="past_key_values.31.keypresent.31.key" variable_type="f32" variable_shape="?,32,?,96" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>0</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32" names="past_key_values.31.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4234" name="Constant_100037" type="Const" version="opset1"> <data element_type="i64" shape="" offset="2" size="8" /> <output> <port id="0" precision="I64" /> </output> </layer> <layer id="4235" name="Gather_100038" type="Gather" version="opset8"> <data batch_dims="0" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>-1</dim> </port> <port id="2" precision="I64" /> </input> <output> <port id="3" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4236" name="Constant_31280" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4237" name="Constant_31282" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635656" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4238" name="Constant_31284" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4239" name="__module.model.model.layers.31.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="5378,key_states.129"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4240" name="Constant_96713" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4241" name="__module.model.model.layers.31.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5384"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="4242" name="__module.model.model.layers.31.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4243" name="__module.model.model.layers.31.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5385,key_states"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4244" name="__module.model.model.layers.31.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="5447"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4245" name="Constant_31980" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4246" name="Constant_31982" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4247" name="Constant_31984" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4248" name="__module.model.model.layers.31.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="5457,x2"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="4249" name="Constant_90348_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4250" name="Constant_90348" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4251" name="__module.model.model.layers.31.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5458"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="4252" name="Constant_31877" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4253" name="Constant_31921" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4254" name="Constant_31923" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4255" name="__module.model.model.layers.31.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="5452"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="4256" name="__module.model.model.layers.31.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="5460"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4257" name="__module.model.model.layers.31.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="5461"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4258" name="__module.model.model.layers.31.self_attn/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="5462"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4259" name="__module.model.model.layers.31.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> <data axis="-2" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="hidden_states.753,present.31.key"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4311" name="Constant_90357_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="7078275412" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4312" name="Constant_90357" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4313" name="Constant_31270" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4314" name="Constant_31272" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635432" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4315" name="Constant_31274" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4316" name="__module.model.model.layers.31.self_attn/aten::slice/Slice_4" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>9216</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="5377,query_states"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4317" name="Constant_96714" type="Const" version="opset1"> <data element_type="i64" shape="4" offset="56635456" size="32" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>4</dim> </port> </output> </layer> <layer id="4318" name="__module.model.model.layers.31.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5381"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="4319" name="__module.model.model.layers.31.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4320" name="__module.model.model.layers.31.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5382,q"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4321" name="__module.model.model.layers.31.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="5431"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4322" name="Constant_31837" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4323" name="Constant_31839" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635638" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4324" name="Constant_31841" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4325" name="__module.model.model.layers.31.self_attn/aten::slice/Slice_5" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="5441,x2.125"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="4326" name="Constant_90349_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1, 1" offset="56635654" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4327" name="Constant_90349" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4328" name="__module.model.model.layers.31.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5442"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="4329" name="Constant_31734" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="2" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4330" name="Constant_31778" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635630" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4331" name="Constant_31780" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="56635440" size="8" /> <output> <port id="0" precision="I64"> <dim>1</dim> </port> </output> </layer> <layer id="4332" name="__module.model.model.layers.31.self_attn/aten::slice/Slice_6" type="Slice" version="opset8"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> <port id="2" precision="I64"> <dim>1</dim> </port> <port id="3" precision="I64"> <dim>1</dim> </port> <port id="4" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="5" precision="FP32" names="5436"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </output> </layer> <layer id="4333" name="__module.model.model.layers.31.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> <data axis="-1" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>48</dim> </port> </input> <output> <port id="2" precision="FP32" names="5444"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4334" name="__module.model.model.layers.31.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="5445"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4335" name="__module.model.model.layers.31.self_attn/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="2" precision="FP32" names="5446"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4336" name="__module.model.model.layers.31.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> <data causal="false" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="2" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="3" precision="FP32"> <dim>-1</dim> <dim>1</dim> <dim>-1</dim> <dim>-1</dim> </port> </input> <output> <port id="4" precision="FP32" names="5472,attn_output.125"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4337" name="__module.model.model.layers.31.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> <data element_type="i32" shape="4" offset="56635488" size="16" /> <output> <port id="0" precision="I32"> <dim>4</dim> </port> </output> </layer> <layer id="4338" name="__module.model.model.layers.31.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> <port id="1" precision="I32"> <dim>4</dim> </port> </input> <output> <port id="2" precision="FP32" names="5473"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> </output> </layer> <layer id="4339" name="Constant_96715" type="Const" version="opset1"> <data element_type="i64" shape="3" offset="56635704" size="24" /> <rt_info> <attribute name="precise" version="0" /> </rt_info> <output> <port id="0" precision="I64"> <dim>3</dim> </port> </output> </layer> <layer id="4340" name="__module.model.model.layers.31.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> <data special_zero="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32</dim> <dim>96</dim> </port> <port id="1" precision="I64"> <dim>3</dim> </port> </input> <output> <port id="2" precision="FP32" names="5476"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4341" name="self.model.model.layers.31.self_attn.o_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 3072" offset="7078281556" size="18874368" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.31.self_attn.o_proj.weight"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4342" name="self.model.model.layers.31.self_attn.o_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4343" name="__module.model.model.layers.31.self_attn.o_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5478,5480,input.187"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4344" name="__module.model.model.layers.31/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5484,5486,5497,hidden_states.757,hidden_states.759"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4345" name="Constant_90353_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 3072" offset="7097155924" size="6144" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4346" name="Constant_90353" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4347" name="Constant_90352_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4348" name="Constant_90352" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4349" name="Constant_90350_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4350" name="Constant_90350" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4351" name="__module.model.model.layers.31.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5487"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4352" name="Constant_32152" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="5488"> <dim>1</dim> </port> </output> </layer> <layer id="4353" name="__module.model.model.layers.31.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5489,variance.127"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4354" name="Constant_90351_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4355" name="Constant_90351" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4356" name="__module.model.model.layers.31.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5490"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4357" name="__module.model.model.layers.31.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4358" name="__module.model.model.layers.31.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5491"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4359" name="__module.model.model.layers.31.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5492,5493,hidden_states.761,hidden_states.763"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4360" name="__module.model.model.layers.31.post_attention_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5494,5496"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4361" name="self.model.model.layers.31.mlp.gate_up_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="16384, 3072" offset="7097162068" size="100663296" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.31.mlp.gate_up_proj.weight"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4362" name="self.model.model.layers.31.mlp.gate_up_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4363" name="__module.model.model.layers.31.mlp.gate_up_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>16384</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5501,up_states.125"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> </output> </layer> <layer id="4364" name="__module.model.model.layers.31.mlp/prim::ListUnpack/VariadicSplit" type="VariadicSplit" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>16384</dim> </port> <port id="1" precision="I64" /> <port id="2" precision="I32"> <dim>2</dim> </port> </input> <output> <port id="3" precision="FP32" names="5503,input.189"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="4" precision="FP32" names="5504,up_states"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="4365" name="__module.model.model.layers.31.mlp.activation_fn/aten::silu/Swish" type="Swish" version="opset4"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32" names="5505"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="4366" name="__module.model.model.layers.31.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="5506"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> </output> </layer> <layer id="4367" name="self.model.model.layers.31.mlp.down_proj.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="3072, 8192" offset="7197825364" size="50331648" /> <output> <port id="0" precision="FP16" names="self.model.model.layers.31.mlp.down_proj.weight"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="4368" name="self.model.model.layers.31.mlp.down_proj.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </output> </layer> <layer id="4369" name="__module.model.model.layers.31.mlp.down_proj/aten::linear/MatMul" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>8192</dim> </port> <port id="1" precision="FP32"> <dim>3072</dim> <dim>8192</dim> </port> </input> <output> <port id="2" precision="FP32" names="5508,input"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4370" name="__module.model.model.layers.31/aten::add/Add_1" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5510,5512,5516,hidden_states.767,hidden_states.769"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4371" name="Constant_90356_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12314" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4372" name="Constant_90356" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4373" name="Constant_90354_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12316" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4374" name="Constant_90354" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4375" name="__module.model.model.norm/aten::pow/Power" type="Power" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5517"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4376" name="Constant_32217" type="Const" version="opset1"> <data element_type="i64" shape="1" offset="12318" size="8" /> <output> <port id="0" precision="I64" names="5518"> <dim>1</dim> </port> </output> </layer> <layer id="4377" name="__module.model.model.norm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> <data keep_dims="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="I64"> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5519,variance"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4378" name="Constant_90355_compressed" type="Const" version="opset1"> <data element_type="f16" shape="1, 1, 1" offset="12326" size="2" /> <output> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4379" name="Constant_90355" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4380" name="__module.model.model.norm/aten::add/Add" type="Add" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5520"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4381" name="__module.model.model.norm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4382" name="__module.model.model.norm/aten::rsqrt/Divide" type="Divide" version="opset1"> <data auto_broadcast="numpy" m_pythondiv="true" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>1</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5521"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </output> </layer> <layer id="4383" name="__module.model.model.norm/aten::mul/Multiply" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>1</dim> </port> </input> <output> <port id="2" precision="FP32" names="5522,5523,hidden_states,hidden_states.771"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4384" name="__module.model.model.norm/aten::mul/Multiply_1" type="Multiply" version="opset1"> <data auto_broadcast="numpy" /> <input> <port id="0" precision="FP32"> <dim>1</dim> <dim>1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="5524,5526"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4385" name="self.model.lm_head.weight_compressed" type="Const" version="opset1"> <data element_type="f16" shape="32064, 3072" offset="7248157012" size="197001216" /> <output> <port id="0" precision="FP16" names="self.model.lm_head.weight"> <dim>32064</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4386" name="self.model.lm_head.weight" type="Convert" version="opset1"> <data destination_type="f32" /> <rt_info> <attribute name="decompression" version="0" /> </rt_info> <input> <port id="0" precision="FP16"> <dim>32064</dim> <dim>3072</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>32064</dim> <dim>3072</dim> </port> </output> </layer> <layer id="4387" name="__module.model/aten::to/Convert" type="MatMul" version="opset1"> <data transpose_a="false" transpose_b="true" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>3072</dim> </port> <port id="1" precision="FP32"> <dim>32064</dim> <dim>3072</dim> </port> </input> <output> <port id="2" precision="FP32" names="logits"> <dim>-1</dim> <dim>-1</dim> <dim>32064</dim> </port> </output> </layer> <layer id="4310" name="Assign_101048" type="Assign" version="opset6"> <data variable_id="past_key_values.0.keypresent.0.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4309" name="Assign_101050" type="Assign" version="opset6"> <data variable_id="past_key_values.0.valuepresent.0.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4308" name="Assign_101052" type="Assign" version="opset6"> <data variable_id="past_key_values.1.keypresent.1.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4307" name="Assign_101054" type="Assign" version="opset6"> <data variable_id="past_key_values.1.valuepresent.1.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4306" name="Assign_101056" type="Assign" version="opset6"> <data variable_id="past_key_values.10.keypresent.10.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4305" name="Assign_101058" type="Assign" version="opset6"> <data variable_id="past_key_values.10.valuepresent.10.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4304" name="Assign_101060" type="Assign" version="opset6"> <data variable_id="past_key_values.11.keypresent.11.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4303" name="Assign_101062" type="Assign" version="opset6"> <data variable_id="past_key_values.11.valuepresent.11.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4302" name="Assign_101064" type="Assign" version="opset6"> <data variable_id="past_key_values.12.keypresent.12.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4301" name="Assign_101066" type="Assign" version="opset6"> <data variable_id="past_key_values.12.valuepresent.12.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4300" name="Assign_101068" type="Assign" version="opset6"> <data variable_id="past_key_values.13.keypresent.13.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4299" name="Assign_101070" type="Assign" version="opset6"> <data variable_id="past_key_values.13.valuepresent.13.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4298" name="Assign_101072" type="Assign" version="opset6"> <data variable_id="past_key_values.14.keypresent.14.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4297" name="Assign_101074" type="Assign" version="opset6"> <data variable_id="past_key_values.14.valuepresent.14.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4296" name="Assign_101076" type="Assign" version="opset6"> <data variable_id="past_key_values.15.keypresent.15.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4295" name="Assign_101078" type="Assign" version="opset6"> <data variable_id="past_key_values.15.valuepresent.15.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4294" name="Assign_101080" type="Assign" version="opset6"> <data variable_id="past_key_values.16.keypresent.16.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4293" name="Assign_101082" type="Assign" version="opset6"> <data variable_id="past_key_values.16.valuepresent.16.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4292" name="Assign_101084" type="Assign" version="opset6"> <data variable_id="past_key_values.17.keypresent.17.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4291" name="Assign_101086" type="Assign" version="opset6"> <data variable_id="past_key_values.17.valuepresent.17.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4290" name="Assign_101088" type="Assign" version="opset6"> <data variable_id="past_key_values.18.keypresent.18.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4289" name="Assign_101090" type="Assign" version="opset6"> <data variable_id="past_key_values.18.valuepresent.18.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4288" name="Assign_101092" type="Assign" version="opset6"> <data variable_id="past_key_values.19.keypresent.19.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4287" name="Assign_101094" type="Assign" version="opset6"> <data variable_id="past_key_values.19.valuepresent.19.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4286" name="Assign_101096" type="Assign" version="opset6"> <data variable_id="past_key_values.2.keypresent.2.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4285" name="Assign_101098" type="Assign" version="opset6"> <data variable_id="past_key_values.2.valuepresent.2.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4284" name="Assign_101100" type="Assign" version="opset6"> <data variable_id="past_key_values.20.keypresent.20.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4283" name="Assign_101102" type="Assign" version="opset6"> <data variable_id="past_key_values.20.valuepresent.20.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4282" name="Assign_101104" type="Assign" version="opset6"> <data variable_id="past_key_values.21.keypresent.21.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4281" name="Assign_101106" type="Assign" version="opset6"> <data variable_id="past_key_values.21.valuepresent.21.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4280" name="Assign_101108" type="Assign" version="opset6"> <data variable_id="past_key_values.22.keypresent.22.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4279" name="Assign_101110" type="Assign" version="opset6"> <data variable_id="past_key_values.22.valuepresent.22.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4278" name="Assign_101112" type="Assign" version="opset6"> <data variable_id="past_key_values.23.keypresent.23.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4277" name="Assign_101114" type="Assign" version="opset6"> <data variable_id="past_key_values.23.valuepresent.23.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4276" name="Assign_101116" type="Assign" version="opset6"> <data variable_id="past_key_values.24.keypresent.24.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4275" name="Assign_101118" type="Assign" version="opset6"> <data variable_id="past_key_values.24.valuepresent.24.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4274" name="Assign_101120" type="Assign" version="opset6"> <data variable_id="past_key_values.25.keypresent.25.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4273" name="Assign_101122" type="Assign" version="opset6"> <data variable_id="past_key_values.25.valuepresent.25.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4272" name="Assign_101124" type="Assign" version="opset6"> <data variable_id="past_key_values.26.keypresent.26.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4271" name="Assign_101126" type="Assign" version="opset6"> <data variable_id="past_key_values.26.valuepresent.26.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4270" name="Assign_101128" type="Assign" version="opset6"> <data variable_id="past_key_values.27.keypresent.27.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4269" name="Assign_101130" type="Assign" version="opset6"> <data variable_id="past_key_values.27.valuepresent.27.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4268" name="Assign_101132" type="Assign" version="opset6"> <data variable_id="past_key_values.28.keypresent.28.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4267" name="Assign_101134" type="Assign" version="opset6"> <data variable_id="past_key_values.28.valuepresent.28.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4266" name="Assign_101136" type="Assign" version="opset6"> <data variable_id="past_key_values.29.keypresent.29.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4265" name="Assign_101138" type="Assign" version="opset6"> <data variable_id="past_key_values.29.valuepresent.29.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4264" name="Assign_101140" type="Assign" version="opset6"> <data variable_id="past_key_values.3.keypresent.3.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4263" name="Assign_101142" type="Assign" version="opset6"> <data variable_id="past_key_values.3.valuepresent.3.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4262" name="Assign_101144" type="Assign" version="opset6"> <data variable_id="past_key_values.30.keypresent.30.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4261" name="Assign_101146" type="Assign" version="opset6"> <data variable_id="past_key_values.30.valuepresent.30.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4260" name="Assign_101148" type="Assign" version="opset6"> <data variable_id="past_key_values.31.keypresent.31.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4225" name="Assign_101150" type="Assign" version="opset6"> <data variable_id="past_key_values.31.valuepresent.31.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1398" name="Assign_101152" type="Assign" version="opset6"> <data variable_id="past_key_values.4.keypresent.4.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1397" name="Assign_101154" type="Assign" version="opset6"> <data variable_id="past_key_values.4.valuepresent.4.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1396" name="Assign_101156" type="Assign" version="opset6"> <data variable_id="past_key_values.5.keypresent.5.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1395" name="Assign_101158" type="Assign" version="opset6"> <data variable_id="past_key_values.5.valuepresent.5.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1394" name="Assign_101160" type="Assign" version="opset6"> <data variable_id="past_key_values.6.keypresent.6.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1393" name="Assign_101162" type="Assign" version="opset6"> <data variable_id="past_key_values.6.valuepresent.6.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1392" name="Assign_101164" type="Assign" version="opset6"> <data variable_id="past_key_values.7.keypresent.7.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1391" name="Assign_101166" type="Assign" version="opset6"> <data variable_id="past_key_values.7.valuepresent.7.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1390" name="Assign_101168" type="Assign" version="opset6"> <data variable_id="past_key_values.8.keypresent.8.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1389" name="Assign_101170" type="Assign" version="opset6"> <data variable_id="past_key_values.8.valuepresent.8.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1388" name="Assign_101172" type="Assign" version="opset6"> <data variable_id="past_key_values.9.keypresent.9.key" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="1353" name="Assign_101174" type="Assign" version="opset6"> <data variable_id="past_key_values.9.valuepresent.9.value" /> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </input> <output> <port id="1" precision="FP32"> <dim>-1</dim> <dim>32</dim> <dim>-1</dim> <dim>96</dim> </port> </output> </layer> <layer id="4388" name="Result_32684" type="Result" version="opset1"> <input> <port id="0" precision="FP32"> <dim>-1</dim> <dim>-1</dim> <dim>32064</dim> </port> </input> </layer> </layers> <edges> <edge from-layer="0" from-port="0" to-layer="1282" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="3894" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="136" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="1118" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="3860" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="1152" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="3764" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="1248" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="3730" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="3990" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="3634" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="1363" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="3600" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="1408" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="3504" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="3470" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="372" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="1520" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="1022" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="988" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="4024" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="892" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="4120" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="858" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="4154" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="4235" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="102" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="762" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="728" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="632" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="598" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="468" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="502" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="2854" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="2334" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="2300" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="2430" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="2464" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="2204" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="2560" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="2170" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="2594" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="2074" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="2690" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="2724" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="17" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="2040" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="2820" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="1944" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="1780" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="3374" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="3340" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="1554" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="3244" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="1650" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="3210" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="1684" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="3114" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="3080" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="338" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="2984" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="1814" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="2950" to-port="1" /> <edge from-layer="0" from-port="0" to-layer="1910" to-port="1" /> <edge from-layer="1" from-port="0" to-layer="6" to-port="0" /> <edge from-layer="1" from-port="0" to-layer="248" to-port="0" /> <edge from-layer="1" from-port="0" to-layer="34" to-port="0" /> <edge from-layer="1" from-port="0" to-layer="26" to-port="0" /> <edge from-layer="1" from-port="0" to-layer="50" to-port="0" /> <edge from-layer="2" from-port="0" to-layer="59" to-port="0" /> <edge from-layer="3" from-port="0" to-layer="148" to-port="0" /> <edge from-layer="3" from-port="0" to-layer="157" to-port="0" /> <edge from-layer="4" from-port="0" to-layer="5" to-port="0" /> <edge from-layer="5" from-port="1" to-layer="14" to-port="0" /> <edge from-layer="6" from-port="1" to-layer="9" to-port="0" /> <edge from-layer="7" from-port="0" to-layer="9" to-port="1" /> <edge from-layer="8" from-port="0" to-layer="9" to-port="2" /> <edge from-layer="9" from-port="3" to-layer="4116" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="4150" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="2166" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="4020" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="984" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="2980" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="1810" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="3336" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="854" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="334" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="2946" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="888" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="2296" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="1516" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="3630" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="2590" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="3890" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="3206" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="1680" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="3760" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="3856" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="1244" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="1646" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="1148" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="3240" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="3110" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="1278" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="1776" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="1114" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="2460" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="132" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="3986" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="3076" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="3726" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="1018" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="3500" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="2816" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="724" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="13" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="1404" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="2556" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="1906" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="2036" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="628" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="464" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="4231" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="3370" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="594" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="2070" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="2720" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="2330" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="2200" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="2686" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="3466" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="498" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="1359" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="1550" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="368" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="2426" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="758" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="2850" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="98" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="3596" to-port="0" /> <edge from-layer="9" from-port="3" to-layer="1940" to-port="0" /> <edge from-layer="10" from-port="0" to-layer="13" to-port="1" /> <edge from-layer="11" from-port="0" to-layer="13" to-port="2" /> <edge from-layer="12" from-port="0" to-layer="13" to-port="3" /> <edge from-layer="13" from-port="4" to-layer="14" to-port="1" /> <edge from-layer="14" from-port="2" to-layer="15" to-port="0" /> <edge from-layer="15" from-port="1" to-layer="17" to-port="0" /> <edge from-layer="16" from-port="0" to-layer="17" to-port="2" /> <edge from-layer="17" from-port="3" to-layer="1352" to-port="0" /> <edge from-layer="18" from-port="0" to-layer="19" to-port="0" /> <edge from-layer="19" from-port="1" to-layer="1340" to-port="0" /> <edge from-layer="20" from-port="0" to-layer="21" to-port="0" /> <edge from-layer="21" from-port="1" to-layer="35" to-port="0" /> <edge from-layer="22" from-port="0" to-layer="23" to-port="0" /> <edge from-layer="23" from-port="1" to-layer="33" to-port="0" /> <edge from-layer="24" from-port="0" to-layer="25" to-port="0" /> <edge from-layer="25" from-port="1" to-layer="26" to-port="1" /> <edge from-layer="26" from-port="2" to-layer="28" to-port="0" /> <edge from-layer="27" from-port="0" to-layer="28" to-port="1" /> <edge from-layer="28" from-port="2" to-layer="31" to-port="0" /> <edge from-layer="29" from-port="0" to-layer="30" to-port="0" /> <edge from-layer="30" from-port="1" to-layer="31" to-port="1" /> <edge from-layer="31" from-port="2" to-layer="32" to-port="0" /> <edge from-layer="32" from-port="1" to-layer="33" to-port="1" /> <edge from-layer="33" from-port="2" to-layer="34" to-port="1" /> <edge from-layer="34" from-port="2" to-layer="35" to-port="1" /> <edge from-layer="35" from-port="2" to-layer="38" to-port="0" /> <edge from-layer="36" from-port="0" to-layer="37" to-port="0" /> <edge from-layer="37" from-port="1" to-layer="38" to-port="1" /> <edge from-layer="38" from-port="2" to-layer="106" to-port="0" /> <edge from-layer="38" from-port="2" to-layer="140" to-port="0" /> <edge from-layer="38" from-port="2" to-layer="43" to-port="0" /> <edge from-layer="39" from-port="0" to-layer="43" to-port="1" /> <edge from-layer="40" from-port="0" to-layer="43" to-port="2" /> <edge from-layer="41" from-port="0" to-layer="43" to-port="3" /> <edge from-layer="42" from-port="0" to-layer="2728" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="1914" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="2824" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="1948" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="2011" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="2598" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="1524" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="2791" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="2921" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="2661" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="2044" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="3378" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="3441" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="2141" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="309" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="2694" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="2078" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="43" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="342" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="1654" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="3214" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="1688" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="1751" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="3181" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="3118" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="2174" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="3248" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="3311" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="3084" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="2858" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="1784" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="1621" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="1558" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="3051" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="2988" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="1818" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="1881" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="2954" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="3344" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="2564" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="4028" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="4158" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="106" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="862" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="4124" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="896" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="959" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="2271" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="4091" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="4219" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="992" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="2208" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="3994" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="1026" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="1089" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="3961" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="3898" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="699" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="2338" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="2401" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="472" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="506" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="569" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="602" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="2304" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="636" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="1491" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="732" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="4316" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="766" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="829" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="2434" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="439" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="4239" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="3508" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="1286" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="3701" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="3734" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="3638" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="1347" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="2531" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="1252" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="3604" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="1367" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="3571" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="3768" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="3831" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="1414" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="1219" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="3474" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="1122" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="140" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="376" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="3864" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="1156" to-port="4" /> <edge from-layer="42" from-port="0" to-layer="2468" to-port="4" /> <edge from-layer="43" from-port="5" to-layer="45" to-port="0" /> <edge from-layer="44" from-port="0" to-layer="45" to-port="1" /> <edge from-layer="45" from-port="2" to-layer="47" to-port="0" /> <edge from-layer="46" from-port="0" to-layer="47" to-port="1" /> <edge from-layer="47" from-port="2" to-layer="84" to-port="0" /> <edge from-layer="47" from-port="2" to-layer="77" to-port="0" /> <edge from-layer="47" from-port="2" to-layer="72" to-port="0" /> <edge from-layer="48" from-port="0" to-layer="49" to-port="0" /> <edge from-layer="49" from-port="1" to-layer="57" to-port="0" /> <edge from-layer="50" from-port="1" to-layer="154" to-port="0" /> <edge from-layer="50" from-port="1" to-layer="53" to-port="0" /> <edge from-layer="51" from-port="0" to-layer="53" to-port="1" /> <edge from-layer="52" from-port="0" to-layer="53" to-port="2" /> <edge from-layer="53" from-port="3" to-layer="56" to-port="0" /> <edge from-layer="53" from-port="3" to-layer="161" to-port="0" /> <edge from-layer="53" from-port="3" to-layer="231" to-port="0" /> <edge from-layer="54" from-port="0" to-layer="56" to-port="1" /> <edge from-layer="55" from-port="0" to-layer="56" to-port="2" /> <edge from-layer="56" from-port="3" to-layer="57" to-port="1" /> <edge from-layer="57" from-port="2" to-layer="63" to-port="0" /> <edge from-layer="58" from-port="0" to-layer="59" to-port="1" /> <edge from-layer="59" from-port="2" to-layer="61" to-port="0" /> <edge from-layer="60" from-port="0" to-layer="228" to-port="1" /> <edge from-layer="60" from-port="0" to-layer="61" to-port="1" /> <edge from-layer="60" from-port="0" to-layer="148" to-port="1" /> <edge from-layer="60" from-port="0" to-layer="90" to-port="1" /> <edge from-layer="60" from-port="0" to-layer="71" to-port="1" /> <edge from-layer="61" from-port="2" to-layer="62" to-port="0" /> <edge from-layer="62" from-port="1" to-layer="63" to-port="1" /> <edge from-layer="63" from-port="2" to-layer="65" to-port="0" /> <edge from-layer="64" from-port="0" to-layer="65" to-port="1" /> <edge from-layer="65" from-port="2" to-layer="66" to-port="0" /> <edge from-layer="65" from-port="2" to-layer="66" to-port="1" /> <edge from-layer="66" from-port="2" to-layer="86" to-port="0" /> <edge from-layer="66" from-port="2" to-layer="67" to-port="0" /> <edge from-layer="67" from-port="1" to-layer="70" to-port="0" /> <edge from-layer="68" from-port="0" to-layer="69" to-port="0" /> <edge from-layer="69" from-port="1" to-layer="70" to-port="1" /> <edge from-layer="70" from-port="2" to-layer="71" to-port="0" /> <edge from-layer="71" from-port="2" to-layer="737" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="1127" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="1094" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="997" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="964" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="2276" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="867" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="834" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="444" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="1224" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="704" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="607" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="2309" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="574" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="477" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="1659" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="314" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="2016" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="1919" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="1886" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="2146" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="1789" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="347" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="1756" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="2049" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="1626" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="1529" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="2179" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="1496" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="1419" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="1372" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="1257" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="2959" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="2666" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="3999" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="2699" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="3966" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="2796" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="4321" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="3869" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="2829" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="3836" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="2926" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="3739" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="2406" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="3706" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="3056" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="3609" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="3089" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="3576" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="3186" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="3479" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="3219" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="3446" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="3316" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="3349" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="4244" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="2536" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="72" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="2569" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="2439" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="111" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="4096" to-port="1" /> <edge from-layer="71" from-port="2" to-layer="4129" to-port="1" /> <edge from-layer="72" from-port="2" to-layer="92" to-port="0" /> <edge from-layer="73" from-port="0" to-layer="77" to-port="1" /> <edge from-layer="74" from-port="0" to-layer="77" to-port="2" /> <edge from-layer="75" from-port="0" to-layer="77" to-port="3" /> <edge from-layer="76" from-port="0" to-layer="1430" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="115" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1423" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3490" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3580" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1383" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="715" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1376" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3587" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="845" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3613" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3620" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="4107" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3483" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="878" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="448" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1500" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1507" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="708" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3457" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="871" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3450" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="455" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3360" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1533" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1540" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3353" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="4133" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="4140" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1098" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="122" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="4325" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1138" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1131" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3873" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3880" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="838" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1105" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="4332" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3970" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3977" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="4255" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="4010" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1001" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="4003" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="4248" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="4100" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3847" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3840" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1228" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1235" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="748" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3750" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3743" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="975" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1261" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1268" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="741" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1008" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="968" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3717" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3710" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="325" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="578" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2027" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="318" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2020" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2807" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="239" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2833" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="585" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2800" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1930" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1923" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2280" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2840" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2287" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2930" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2937" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1897" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2150" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2450" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2540" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2547" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2190" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2183" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2573" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2580" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2157" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1890" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2670" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2677" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="77" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2060" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2053" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2703" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2710" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2443" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3223" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2963" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="618" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2417" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3190" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3197" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="351" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2410" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1670" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1663" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3100" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3230" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="358" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2313" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1637" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2320" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1630" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3320" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3327" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="481" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="2970" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1800" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1793" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3060" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="488" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3067" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="611" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="3093" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="84" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1767" to-port="4" /> <edge from-layer="76" from-port="0" to-layer="1760" to-port="4" /> <edge from-layer="77" from-port="5" to-layer="80" to-port="0" /> <edge from-layer="78" from-port="0" to-layer="79" to-port="0" /> <edge from-layer="79" from-port="1" to-layer="80" to-port="1" /> <edge from-layer="80" from-port="2" to-layer="85" to-port="0" /> <edge from-layer="81" from-port="0" to-layer="84" to-port="1" /> <edge from-layer="82" from-port="0" to-layer="84" to-port="2" /> <edge from-layer="83" from-port="0" to-layer="84" to-port="3" /> <edge from-layer="84" from-port="5" to-layer="85" to-port="1" /> <edge from-layer="85" from-port="2" to-layer="91" to-port="0" /> <edge from-layer="86" from-port="1" to-layer="89" to-port="0" /> <edge from-layer="87" from-port="0" to-layer="88" to-port="0" /> <edge from-layer="88" from-port="1" to-layer="89" to-port="1" /> <edge from-layer="89" from-port="2" to-layer="90" to-port="0" /> <edge from-layer="90" from-port="2" to-layer="490" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="4257" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="750" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="587" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="4334" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="847" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="717" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="620" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="2192" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="2809" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="3232" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="1672" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="3199" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="3102" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="1769" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="3069" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="1802" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="2972" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="2939" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="1899" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="2842" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="1932" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="1639" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="2029" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="2712" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="2062" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="2679" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="2582" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="2159" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="2549" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="2452" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="2289" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="2419" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="2322" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="1270" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="880" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="4109" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="977" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="4012" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="1010" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="3979" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="1107" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="3882" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="1140" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="3849" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="1237" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="3752" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="4142" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="3719" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="3622" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="3589" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="1385" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="3492" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="1432" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="3459" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="1509" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="3362" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="1542" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="3329" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="457" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="360" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="327" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="91" to-port="1" /> <edge from-layer="90" from-port="2" to-layer="124" to-port="1" /> <edge from-layer="91" from-port="2" to-layer="92" to-port="1" /> <edge from-layer="92" from-port="2" to-layer="240" to-port="0" /> <edge from-layer="93" from-port="0" to-layer="94" to-port="0" /> <edge from-layer="94" from-port="1" to-layer="99" to-port="0" /> <edge from-layer="95" from-port="0" to-layer="98" to-port="1" /> <edge from-layer="96" from-port="0" to-layer="98" to-port="2" /> <edge from-layer="97" from-port="0" to-layer="98" to-port="3" /> <edge from-layer="98" from-port="4" to-layer="99" to-port="1" /> <edge from-layer="99" from-port="2" to-layer="100" to-port="0" /> <edge from-layer="100" from-port="1" to-layer="102" to-port="0" /> <edge from-layer="101" from-port="0" to-layer="102" to-port="2" /> <edge from-layer="102" from-port="3" to-layer="176" to-port="0" /> <edge from-layer="102" from-port="3" to-layer="126" to-port="0" /> <edge from-layer="103" from-port="0" to-layer="106" to-port="1" /> <edge from-layer="104" from-port="0" to-layer="106" to-port="2" /> <edge from-layer="105" from-port="0" to-layer="106" to-port="3" /> <edge from-layer="106" from-port="5" to-layer="108" to-port="0" /> <edge from-layer="107" from-port="0" to-layer="108" to-port="1" /> <edge from-layer="108" from-port="2" to-layer="110" to-port="0" /> <edge from-layer="109" from-port="0" to-layer="110" to-port="1" /> <edge from-layer="110" from-port="2" to-layer="122" to-port="0" /> <edge from-layer="110" from-port="2" to-layer="115" to-port="0" /> <edge from-layer="110" from-port="2" to-layer="111" to-port="0" /> <edge from-layer="111" from-port="2" to-layer="125" to-port="0" /> <edge from-layer="112" from-port="0" to-layer="115" to-port="1" /> <edge from-layer="113" from-port="0" to-layer="115" to-port="2" /> <edge from-layer="114" from-port="0" to-layer="115" to-port="3" /> <edge from-layer="115" from-port="5" to-layer="118" to-port="0" /> <edge from-layer="116" from-port="0" to-layer="117" to-port="0" /> <edge from-layer="117" from-port="1" to-layer="118" to-port="1" /> <edge from-layer="118" from-port="2" to-layer="123" to-port="0" /> <edge from-layer="119" from-port="0" to-layer="122" to-port="1" /> <edge from-layer="120" from-port="0" to-layer="122" to-port="2" /> <edge from-layer="121" from-port="0" to-layer="122" to-port="3" /> <edge from-layer="122" from-port="5" to-layer="123" to-port="1" /> <edge from-layer="123" from-port="2" to-layer="124" to-port="0" /> <edge from-layer="124" from-port="2" to-layer="125" to-port="1" /> <edge from-layer="125" from-port="2" to-layer="126" to-port="1" /> <edge from-layer="126" from-port="2" to-layer="4310" to-port="0" /> <edge from-layer="126" from-port="2" to-layer="240" to-port="1" /> <edge from-layer="127" from-port="0" to-layer="128" to-port="0" /> <edge from-layer="128" from-port="1" to-layer="133" to-port="0" /> <edge from-layer="129" from-port="0" to-layer="132" to-port="1" /> <edge from-layer="130" from-port="0" to-layer="132" to-port="2" /> <edge from-layer="131" from-port="0" to-layer="132" to-port="3" /> <edge from-layer="132" from-port="4" to-layer="133" to-port="1" /> <edge from-layer="133" from-port="2" to-layer="134" to-port="0" /> <edge from-layer="134" from-port="1" to-layer="136" to-port="0" /> <edge from-layer="135" from-port="0" to-layer="136" to-port="2" /> <edge from-layer="136" from-port="3" to-layer="145" to-port="0" /> <edge from-layer="137" from-port="0" to-layer="140" to-port="1" /> <edge from-layer="138" from-port="0" to-layer="140" to-port="2" /> <edge from-layer="139" from-port="0" to-layer="140" to-port="3" /> <edge from-layer="140" from-port="5" to-layer="142" to-port="0" /> <edge from-layer="141" from-port="0" to-layer="142" to-port="1" /> <edge from-layer="142" from-port="2" to-layer="144" to-port="0" /> <edge from-layer="143" from-port="0" to-layer="144" to-port="1" /> <edge from-layer="144" from-port="2" to-layer="145" to-port="1" /> <edge from-layer="145" from-port="2" to-layer="240" to-port="2" /> <edge from-layer="145" from-port="2" to-layer="4309" to-port="0" /> <edge from-layer="146" from-port="0" to-layer="147" to-port="0" /> <edge from-layer="147" from-port="1" to-layer="167" to-port="0" /> <edge from-layer="148" from-port="2" to-layer="150" to-port="0" /> <edge from-layer="149" from-port="0" to-layer="150" to-port="1" /> <edge from-layer="150" from-port="2" to-layer="162" to-port="0" /> <edge from-layer="151" from-port="0" to-layer="161" to-port="1" /> <edge from-layer="152" from-port="0" to-layer="154" to-port="1" /> <edge from-layer="153" from-port="0" to-layer="154" to-port="2" /> <edge from-layer="154" from-port="3" to-layer="180" to-port="0" /> <edge from-layer="154" from-port="3" to-layer="156" to-port="0" /> <edge from-layer="154" from-port="3" to-layer="181" to-port="1" /> <edge from-layer="154" from-port="3" to-layer="205" to-port="1" /> <edge from-layer="154" from-port="3" to-layer="190" to-port="0" /> <edge from-layer="155" from-port="0" to-layer="156" to-port="1" /> <edge from-layer="156" from-port="2" to-layer="184" to-port="0" /> <edge from-layer="156" from-port="2" to-layer="231" to-port="2" /> <edge from-layer="156" from-port="2" to-layer="230" to-port="0" /> <edge from-layer="156" from-port="2" to-layer="237" to-port="1" /> <edge from-layer="156" from-port="2" to-layer="215" to-port="0" /> <edge from-layer="156" from-port="2" to-layer="161" to-port="2" /> <edge from-layer="157" from-port="1" to-layer="160" to-port="0" /> <edge from-layer="158" from-port="0" to-layer="160" to-port="1" /> <edge from-layer="159" from-port="0" to-layer="160" to-port="2" /> <edge from-layer="160" from-port="3" to-layer="161" to-port="3" /> <edge from-layer="161" from-port="4" to-layer="162" to-port="1" /> <edge from-layer="162" from-port="2" to-layer="163" to-port="0" /> <edge from-layer="163" from-port="1" to-layer="166" to-port="0" /> <edge from-layer="164" from-port="0" to-layer="165" to-port="0" /> <edge from-layer="165" from-port="1" to-layer="166" to-port="1" /> <edge from-layer="166" from-port="2" to-layer="167" to-port="1" /> <edge from-layer="167" from-port="2" to-layer="170" to-port="2" /> <edge from-layer="167" from-port="2" to-layer="168" to-port="0" /> <edge from-layer="168" from-port="1" to-layer="170" to-port="0" /> <edge from-layer="169" from-port="0" to-layer="225" to-port="1" /> <edge from-layer="169" from-port="0" to-layer="216" to-port="0" /> <edge from-layer="169" from-port="0" to-layer="170" to-port="1" /> <edge from-layer="169" from-port="0" to-layer="233" to-port="1" /> <edge from-layer="170" from-port="3" to-layer="171" to-port="0" /> <edge from-layer="171" from-port="1" to-layer="233" to-port="0" /> <edge from-layer="172" from-port="0" to-layer="223" to-port="0" /> <edge from-layer="173" from-port="0" to-layer="193" to-port="0" /> <edge from-layer="173" from-port="0" to-layer="194" to-port="1" /> <edge from-layer="174" from-port="0" to-layer="175" to-port="0" /> <edge from-layer="175" from-port="1" to-layer="185" to-port="0" /> <edge from-layer="176" from-port="1" to-layer="179" to-port="0" /> <edge from-layer="177" from-port="0" to-layer="179" to-port="1" /> <edge from-layer="178" from-port="0" to-layer="179" to-port="2" /> <edge from-layer="179" from-port="3" to-layer="236" to-port="0" /> <edge from-layer="179" from-port="3" to-layer="180" to-port="1" /> <edge from-layer="180" from-port="2" to-layer="181" to-port="0" /> <edge from-layer="181" from-port="2" to-layer="183" to-port="0" /> <edge from-layer="181" from-port="2" to-layer="196" to-port="0" /> <edge from-layer="182" from-port="0" to-layer="183" to-port="1" /> <edge from-layer="183" from-port="2" to-layer="230" to-port="1" /> <edge from-layer="183" from-port="2" to-layer="184" to-port="1" /> <edge from-layer="184" from-port="2" to-layer="185" to-port="1" /> <edge from-layer="185" from-port="2" to-layer="186" to-port="0" /> <edge from-layer="185" from-port="2" to-layer="218" to-port="0" /> <edge from-layer="186" from-port="1" to-layer="189" to-port="0" /> <edge from-layer="187" from-port="0" to-layer="189" to-port="1" /> <edge from-layer="188" from-port="0" to-layer="189" to-port="2" /> <edge from-layer="189" from-port="3" to-layer="191" to-port="0" /> <edge from-layer="190" from-port="1" to-layer="198" to-port="0" /> <edge from-layer="190" from-port="1" to-layer="191" to-port="1" /> <edge from-layer="191" from-port="2" to-layer="193" to-port="1" /> <edge from-layer="192" from-port="0" to-layer="199" to-port="2" /> <edge from-layer="192" from-port="0" to-layer="193" to-port="2" /> <edge from-layer="192" from-port="0" to-layer="200" to-port="1" /> <edge from-layer="193" from-port="3" to-layer="194" to-port="0" /> <edge from-layer="194" from-port="2" to-layer="201" to-port="0" /> <edge from-layer="195" from-port="0" to-layer="196" to-port="1" /> <edge from-layer="196" from-port="2" to-layer="197" to-port="0" /> <edge from-layer="197" from-port="1" to-layer="198" to-port="1" /> <edge from-layer="197" from-port="1" to-layer="199" to-port="0" /> <edge from-layer="198" from-port="2" to-layer="199" to-port="1" /> <edge from-layer="199" from-port="3" to-layer="200" to-port="0" /> <edge from-layer="200" from-port="2" to-layer="201" to-port="1" /> <edge from-layer="201" from-port="2" to-layer="222" to-port="0" /> <edge from-layer="202" from-port="0" to-layer="220" to-port="0" /> <edge from-layer="203" from-port="0" to-layer="205" to-port="0" /> <edge from-layer="204" from-port="0" to-layer="205" to-port="2" /> <edge from-layer="205" from-port="3" to-layer="206" to-port="0" /> <edge from-layer="206" from-port="1" to-layer="208" to-port="0" /> <edge from-layer="206" from-port="1" to-layer="211" to-port="0" /> <edge from-layer="207" from-port="0" to-layer="208" to-port="1" /> <edge from-layer="208" from-port="2" to-layer="210" to-port="0" /> <edge from-layer="209" from-port="0" to-layer="210" to-port="1" /> <edge from-layer="210" from-port="2" to-layer="211" to-port="1" /> <edge from-layer="211" from-port="2" to-layer="217" to-port="0" /> <edge from-layer="212" from-port="0" to-layer="213" to-port="0" /> <edge from-layer="213" from-port="1" to-layer="217" to-port="1" /> <edge from-layer="214" from-port="0" to-layer="215" to-port="1" /> <edge from-layer="215" from-port="2" to-layer="216" to-port="1" /> <edge from-layer="216" from-port="2" to-layer="217" to-port="2" /> <edge from-layer="217" from-port="3" to-layer="218" to-port="1" /> <edge from-layer="218" from-port="2" to-layer="225" to-port="2" /> <edge from-layer="218" from-port="2" to-layer="219" to-port="0" /> <edge from-layer="219" from-port="1" to-layer="220" to-port="1" /> <edge from-layer="220" from-port="2" to-layer="222" to-port="1" /> <edge from-layer="221" from-port="0" to-layer="222" to-port="2" /> <edge from-layer="222" from-port="3" to-layer="223" to-port="1" /> <edge from-layer="223" from-port="2" to-layer="224" to-port="0" /> <edge from-layer="224" from-port="1" to-layer="225" to-port="0" /> <edge from-layer="225" from-port="3" to-layer="227" to-port="0" /> <edge from-layer="226" from-port="0" to-layer="227" to-port="1" /> <edge from-layer="227" from-port="2" to-layer="228" to-port="0" /> <edge from-layer="228" from-port="2" to-layer="232" to-port="0" /> <edge from-layer="229" from-port="0" to-layer="231" to-port="1" /> <edge from-layer="230" from-port="2" to-layer="231" to-port="3" /> <edge from-layer="231" from-port="4" to-layer="232" to-port="1" /> <edge from-layer="232" from-port="2" to-layer="233" to-port="2" /> <edge from-layer="233" from-port="3" to-layer="239" to-port="0" /> <edge from-layer="234" from-port="0" to-layer="239" to-port="1" /> <edge from-layer="235" from-port="0" to-layer="236" to-port="1" /> <edge from-layer="236" from-port="2" to-layer="237" to-port="0" /> <edge from-layer="237" from-port="2" to-layer="239" to-port="2" /> <edge from-layer="238" from-port="0" to-layer="239" to-port="3" /> <edge from-layer="239" from-port="5" to-layer="382" to-port="3" /> <edge from-layer="239" from-port="5" to-layer="2474" to-port="3" /> <edge from-layer="239" from-port="5" to-layer="1434" to-port="3" /> <edge from-layer="239" from-port="5" to-layer="642" to-port="3" /> <edge from-layer="239" from-port="5" to-layer="3774" to-port="3" /> <edge from-layer="239" from-port="5" to-layer="240" to-port="3" /> <edge from-layer="239" from-port="5" to-layer="1292" to-port="3" /> <edge from-layer="239" from-port="5" to-layer="1162" to-port="3" /> <edge from-layer="239" from-port="5" to-layer="2734" to-port="3" /> <edge from-layer="239" from-port="5" to-layer="1032" to-port="3" /> <edge from-layer="239" from-port="5" to-layer="902" to-port="3" /> <edge from-layer="239" from-port="5" to-layer="2864" to-port="3" /> <edge from-layer="239" from-port="5" to-layer="3384" to-port="3" /> <edge from-layer="239" from-port="5" to-layer="772" to-port="3" /> <edge from-layer="239" from-port="5" to-layer="4164" to-port="3" /> <edge from-layer="239" from-port="5" to-layer="2344" to-port="3" /> <edge from-layer="239" from-port="5" to-layer="2214" to-port="3" /> <edge from-layer="239" from-port="5" to-layer="2084" to-port="3" /> <edge from-layer="239" from-port="5" to-layer="1564" to-port="3" /> <edge from-layer="239" from-port="5" to-layer="3254" to-port="3" /> <edge from-layer="239" from-port="5" to-layer="4336" to-port="3" /> <edge from-layer="239" from-port="5" to-layer="3514" to-port="3" /> <edge from-layer="239" from-port="5" to-layer="1954" to-port="3" /> <edge from-layer="239" from-port="5" to-layer="3124" to-port="3" /> <edge from-layer="239" from-port="5" to-layer="512" to-port="3" /> <edge from-layer="239" from-port="5" to-layer="1694" to-port="3" /> <edge from-layer="239" from-port="5" to-layer="3644" to-port="3" /> <edge from-layer="239" from-port="5" to-layer="2994" to-port="3" /> <edge from-layer="239" from-port="5" to-layer="1824" to-port="3" /> <edge from-layer="239" from-port="5" to-layer="3904" to-port="3" /> <edge from-layer="239" from-port="5" to-layer="4034" to-port="3" /> <edge from-layer="239" from-port="5" to-layer="2604" to-port="3" /> <edge from-layer="240" from-port="4" to-layer="242" to-port="0" /> <edge from-layer="241" from-port="0" to-layer="242" to-port="1" /> <edge from-layer="242" from-port="2" to-layer="244" to-port="0" /> <edge from-layer="243" from-port="0" to-layer="244" to-port="1" /> <edge from-layer="244" from-port="2" to-layer="247" to-port="0" /> <edge from-layer="245" from-port="0" to-layer="246" to-port="0" /> <edge from-layer="246" from-port="1" to-layer="247" to-port="1" /> <edge from-layer="247" from-port="2" to-layer="248" to-port="1" /> <edge from-layer="248" from-port="2" to-layer="286" to-port="0" /> <edge from-layer="248" from-port="2" to-layer="255" to-port="0" /> <edge from-layer="248" from-port="2" to-layer="263" to-port="0" /> <edge from-layer="249" from-port="0" to-layer="250" to-port="0" /> <edge from-layer="250" from-port="1" to-layer="264" to-port="0" /> <edge from-layer="251" from-port="0" to-layer="252" to-port="0" /> <edge from-layer="252" from-port="1" to-layer="262" to-port="0" /> <edge from-layer="253" from-port="0" to-layer="254" to-port="0" /> <edge from-layer="254" from-port="1" to-layer="255" to-port="1" /> <edge from-layer="255" from-port="2" to-layer="257" to-port="0" /> <edge from-layer="256" from-port="0" to-layer="257" to-port="1" /> <edge from-layer="257" from-port="2" to-layer="260" to-port="0" /> <edge from-layer="258" from-port="0" to-layer="259" to-port="0" /> <edge from-layer="259" from-port="1" to-layer="260" to-port="1" /> <edge from-layer="260" from-port="2" to-layer="261" to-port="0" /> <edge from-layer="261" from-port="1" to-layer="262" to-port="1" /> <edge from-layer="262" from-port="2" to-layer="263" to-port="1" /> <edge from-layer="263" from-port="2" to-layer="264" to-port="1" /> <edge from-layer="264" from-port="2" to-layer="267" to-port="0" /> <edge from-layer="265" from-port="0" to-layer="266" to-port="0" /> <edge from-layer="266" from-port="1" to-layer="267" to-port="1" /> <edge from-layer="267" from-port="2" to-layer="280" to-port="0" /> <edge from-layer="267" from-port="2" to-layer="269" to-port="0" /> <edge from-layer="268" from-port="0" to-layer="2372" to-port="1" /> <edge from-layer="268" from-port="0" to-layer="930" to-port="1" /> <edge from-layer="268" from-port="0" to-layer="2242" to-port="1" /> <edge from-layer="268" from-port="0" to-layer="271" to-port="1" /> <edge from-layer="268" from-port="0" to-layer="280" to-port="1" /> <edge from-layer="268" from-port="0" to-layer="4192" to-port="1" /> <edge from-layer="268" from-port="0" to-layer="4364" to-port="1" /> <edge from-layer="268" from-port="0" to-layer="1060" to-port="1" /> <edge from-layer="268" from-port="0" to-layer="410" to-port="1" /> <edge from-layer="268" from-port="0" to-layer="1190" to-port="1" /> <edge from-layer="268" from-port="0" to-layer="1320" to-port="1" /> <edge from-layer="268" from-port="0" to-layer="1462" to-port="1" /> <edge from-layer="268" from-port="0" to-layer="1592" to-port="1" /> <edge from-layer="268" from-port="0" to-layer="1722" to-port="1" /> <edge from-layer="268" from-port="0" to-layer="800" to-port="1" /> <edge from-layer="268" from-port="0" to-layer="1852" to-port="1" /> <edge from-layer="268" from-port="0" to-layer="1982" to-port="1" /> <edge from-layer="268" from-port="0" to-layer="2112" to-port="1" /> <edge from-layer="268" from-port="0" to-layer="4062" to-port="1" /> <edge from-layer="268" from-port="0" to-layer="2892" to-port="1" /> <edge from-layer="268" from-port="0" to-layer="3542" to-port="1" /> <edge from-layer="268" from-port="0" to-layer="2762" to-port="1" /> <edge from-layer="268" from-port="0" to-layer="3672" to-port="1" /> <edge from-layer="268" from-port="0" to-layer="2632" to-port="1" /> <edge from-layer="268" from-port="0" to-layer="3802" to-port="1" /> <edge from-layer="268" from-port="0" to-layer="3932" to-port="1" /> <edge from-layer="268" from-port="0" to-layer="540" to-port="1" /> <edge from-layer="268" from-port="0" to-layer="3282" to-port="1" /> <edge from-layer="268" from-port="0" to-layer="670" to-port="1" /> <edge from-layer="268" from-port="0" to-layer="2502" to-port="1" /> <edge from-layer="268" from-port="0" to-layer="3152" to-port="1" /> <edge from-layer="268" from-port="0" to-layer="3412" to-port="1" /> <edge from-layer="268" from-port="0" to-layer="3022" to-port="1" /> <edge from-layer="269" from-port="1" to-layer="271" to-port="0" /> <edge from-layer="270" from-port="0" to-layer="271" to-port="2" /> <edge from-layer="270" from-port="0" to-layer="275" to-port="1" /> <edge from-layer="271" from-port="3" to-layer="273" to-port="0" /> <edge from-layer="271" from-port="3" to-layer="274" to-port="0" /> <edge from-layer="272" from-port="0" to-layer="273" to-port="1" /> <edge from-layer="272" from-port="0" to-layer="274" to-port="1" /> <edge from-layer="273" from-port="2" to-layer="277" to-port="0" /> <edge from-layer="274" from-port="2" to-layer="275" to-port="0" /> <edge from-layer="275" from-port="2" to-layer="276" to-port="0" /> <edge from-layer="276" from-port="1" to-layer="277" to-port="1" /> <edge from-layer="277" from-port="2" to-layer="279" to-port="0" /> <edge from-layer="278" from-port="0" to-layer="279" to-port="1" /> <edge from-layer="279" from-port="2" to-layer="1852" to-port="2" /> <edge from-layer="279" from-port="2" to-layer="2112" to-port="2" /> <edge from-layer="279" from-port="2" to-layer="930" to-port="2" /> <edge from-layer="279" from-port="2" to-layer="3932" to-port="2" /> <edge from-layer="279" from-port="2" to-layer="2372" to-port="2" /> <edge from-layer="279" from-port="2" to-layer="3412" to-port="2" /> <edge from-layer="279" from-port="2" to-layer="2502" to-port="2" /> <edge from-layer="279" from-port="2" to-layer="280" to-port="2" /> <edge from-layer="279" from-port="2" to-layer="3022" to-port="2" /> <edge from-layer="279" from-port="2" to-layer="540" to-port="2" /> <edge from-layer="279" from-port="2" to-layer="4192" to-port="2" /> <edge from-layer="279" from-port="2" to-layer="3282" to-port="2" /> <edge from-layer="279" from-port="2" to-layer="670" to-port="2" /> <edge from-layer="279" from-port="2" to-layer="1982" to-port="2" /> <edge from-layer="279" from-port="2" to-layer="2242" to-port="2" /> <edge from-layer="279" from-port="2" to-layer="3152" to-port="2" /> <edge from-layer="279" from-port="2" to-layer="800" to-port="2" /> <edge from-layer="279" from-port="2" to-layer="1320" to-port="2" /> <edge from-layer="279" from-port="2" to-layer="1462" to-port="2" /> <edge from-layer="279" from-port="2" to-layer="2892" to-port="2" /> <edge from-layer="279" from-port="2" to-layer="3542" to-port="2" /> <edge from-layer="279" from-port="2" to-layer="1592" to-port="2" /> <edge from-layer="279" from-port="2" to-layer="1190" to-port="2" /> <edge from-layer="279" from-port="2" to-layer="2632" to-port="2" /> <edge from-layer="279" from-port="2" to-layer="2762" to-port="2" /> <edge from-layer="279" from-port="2" to-layer="3672" to-port="2" /> <edge from-layer="279" from-port="2" to-layer="1722" to-port="2" /> <edge from-layer="279" from-port="2" to-layer="4364" to-port="2" /> <edge from-layer="279" from-port="2" to-layer="4062" to-port="2" /> <edge from-layer="279" from-port="2" to-layer="410" to-port="2" /> <edge from-layer="279" from-port="2" to-layer="1060" to-port="2" /> <edge from-layer="279" from-port="2" to-layer="3802" to-port="2" /> <edge from-layer="280" from-port="3" to-layer="281" to-port="0" /> <edge from-layer="280" from-port="4" to-layer="282" to-port="0" /> <edge from-layer="281" from-port="1" to-layer="282" to-port="1" /> <edge from-layer="282" from-port="2" to-layer="285" to-port="0" /> <edge from-layer="283" from-port="0" to-layer="284" to-port="0" /> <edge from-layer="284" from-port="1" to-layer="285" to-port="1" /> <edge from-layer="285" from-port="2" to-layer="286" to-port="1" /> <edge from-layer="286" from-port="2" to-layer="390" to-port="0" /> <edge from-layer="286" from-port="2" to-layer="301" to-port="0" /> <edge from-layer="286" from-port="2" to-layer="293" to-port="0" /> <edge from-layer="287" from-port="0" to-layer="288" to-port="0" /> <edge from-layer="288" from-port="1" to-layer="302" to-port="0" /> <edge from-layer="289" from-port="0" to-layer="290" to-port="0" /> <edge from-layer="290" from-port="1" to-layer="300" to-port="0" /> <edge from-layer="291" from-port="0" to-layer="292" to-port="0" /> <edge from-layer="292" from-port="1" to-layer="293" to-port="1" /> <edge from-layer="293" from-port="2" to-layer="295" to-port="0" /> <edge from-layer="294" from-port="0" to-layer="295" to-port="1" /> <edge from-layer="295" from-port="2" to-layer="298" to-port="0" /> <edge from-layer="296" from-port="0" to-layer="297" to-port="0" /> <edge from-layer="297" from-port="1" to-layer="298" to-port="1" /> <edge from-layer="298" from-port="2" to-layer="299" to-port="0" /> <edge from-layer="299" from-port="1" to-layer="300" to-port="1" /> <edge from-layer="300" from-port="2" to-layer="301" to-port="1" /> <edge from-layer="301" from-port="2" to-layer="302" to-port="1" /> <edge from-layer="302" from-port="2" to-layer="305" to-port="0" /> <edge from-layer="303" from-port="0" to-layer="304" to-port="0" /> <edge from-layer="304" from-port="1" to-layer="305" to-port="1" /> <edge from-layer="305" from-port="2" to-layer="376" to-port="0" /> <edge from-layer="305" from-port="2" to-layer="342" to-port="0" /> <edge from-layer="305" from-port="2" to-layer="309" to-port="0" /> <edge from-layer="306" from-port="0" to-layer="309" to-port="1" /> <edge from-layer="307" from-port="0" to-layer="309" to-port="2" /> <edge from-layer="308" from-port="0" to-layer="309" to-port="3" /> <edge from-layer="309" from-port="5" to-layer="311" to-port="0" /> <edge from-layer="310" from-port="0" to-layer="311" to-port="1" /> <edge from-layer="311" from-port="2" to-layer="313" to-port="0" /> <edge from-layer="312" from-port="0" to-layer="313" to-port="1" /> <edge from-layer="313" from-port="2" to-layer="325" to-port="0" /> <edge from-layer="313" from-port="2" to-layer="318" to-port="0" /> <edge from-layer="313" from-port="2" to-layer="314" to-port="0" /> <edge from-layer="314" from-port="2" to-layer="328" to-port="0" /> <edge from-layer="315" from-port="0" to-layer="318" to-port="1" /> <edge from-layer="316" from-port="0" to-layer="318" to-port="2" /> <edge from-layer="317" from-port="0" to-layer="318" to-port="3" /> <edge from-layer="318" from-port="5" to-layer="321" to-port="0" /> <edge from-layer="319" from-port="0" to-layer="320" to-port="0" /> <edge from-layer="320" from-port="1" to-layer="321" to-port="1" /> <edge from-layer="321" from-port="2" to-layer="326" to-port="0" /> <edge from-layer="322" from-port="0" to-layer="325" to-port="1" /> <edge from-layer="323" from-port="0" to-layer="325" to-port="2" /> <edge from-layer="324" from-port="0" to-layer="325" to-port="3" /> <edge from-layer="325" from-port="5" to-layer="326" to-port="1" /> <edge from-layer="326" from-port="2" to-layer="327" to-port="0" /> <edge from-layer="327" from-port="2" to-layer="328" to-port="1" /> <edge from-layer="328" from-port="2" to-layer="382" to-port="0" /> <edge from-layer="329" from-port="0" to-layer="330" to-port="0" /> <edge from-layer="330" from-port="1" to-layer="335" to-port="0" /> <edge from-layer="331" from-port="0" to-layer="334" to-port="1" /> <edge from-layer="332" from-port="0" to-layer="334" to-port="2" /> <edge from-layer="333" from-port="0" to-layer="334" to-port="3" /> <edge from-layer="334" from-port="4" to-layer="335" to-port="1" /> <edge from-layer="335" from-port="2" to-layer="336" to-port="0" /> <edge from-layer="336" from-port="1" to-layer="338" to-port="0" /> <edge from-layer="337" from-port="0" to-layer="338" to-port="2" /> <edge from-layer="338" from-port="3" to-layer="362" to-port="0" /> <edge from-layer="339" from-port="0" to-layer="342" to-port="1" /> <edge from-layer="340" from-port="0" to-layer="342" to-port="2" /> <edge from-layer="341" from-port="0" to-layer="342" to-port="3" /> <edge from-layer="342" from-port="5" to-layer="344" to-port="0" /> <edge from-layer="343" from-port="0" to-layer="344" to-port="1" /> <edge from-layer="344" from-port="2" to-layer="346" to-port="0" /> <edge from-layer="345" from-port="0" to-layer="346" to-port="1" /> <edge from-layer="346" from-port="2" to-layer="347" to-port="0" /> <edge from-layer="346" from-port="2" to-layer="351" to-port="0" /> <edge from-layer="346" from-port="2" to-layer="358" to-port="0" /> <edge from-layer="347" from-port="2" to-layer="361" to-port="0" /> <edge from-layer="348" from-port="0" to-layer="351" to-port="1" /> <edge from-layer="349" from-port="0" to-layer="351" to-port="2" /> <edge from-layer="350" from-port="0" to-layer="351" to-port="3" /> <edge from-layer="351" from-port="5" to-layer="354" to-port="0" /> <edge from-layer="352" from-port="0" to-layer="353" to-port="0" /> <edge from-layer="353" from-port="1" to-layer="354" to-port="1" /> <edge from-layer="354" from-port="2" to-layer="359" to-port="0" /> <edge from-layer="355" from-port="0" to-layer="358" to-port="1" /> <edge from-layer="356" from-port="0" to-layer="358" to-port="2" /> <edge from-layer="357" from-port="0" to-layer="358" to-port="3" /> <edge from-layer="358" from-port="5" to-layer="359" to-port="1" /> <edge from-layer="359" from-port="2" to-layer="360" to-port="0" /> <edge from-layer="360" from-port="2" to-layer="361" to-port="1" /> <edge from-layer="361" from-port="2" to-layer="362" to-port="1" /> <edge from-layer="362" from-port="2" to-layer="382" to-port="1" /> <edge from-layer="362" from-port="2" to-layer="4308" to-port="0" /> <edge from-layer="363" from-port="0" to-layer="364" to-port="0" /> <edge from-layer="364" from-port="1" to-layer="369" to-port="0" /> <edge from-layer="365" from-port="0" to-layer="368" to-port="1" /> <edge from-layer="366" from-port="0" to-layer="368" to-port="2" /> <edge from-layer="367" from-port="0" to-layer="368" to-port="3" /> <edge from-layer="368" from-port="4" to-layer="369" to-port="1" /> <edge from-layer="369" from-port="2" to-layer="370" to-port="0" /> <edge from-layer="370" from-port="1" to-layer="372" to-port="0" /> <edge from-layer="371" from-port="0" to-layer="372" to-port="2" /> <edge from-layer="372" from-port="3" to-layer="381" to-port="0" /> <edge from-layer="373" from-port="0" to-layer="376" to-port="1" /> <edge from-layer="374" from-port="0" to-layer="376" to-port="2" /> <edge from-layer="375" from-port="0" to-layer="376" to-port="3" /> <edge from-layer="376" from-port="5" to-layer="378" to-port="0" /> <edge from-layer="377" from-port="0" to-layer="378" to-port="1" /> <edge from-layer="378" from-port="2" to-layer="380" to-port="0" /> <edge from-layer="379" from-port="0" to-layer="380" to-port="1" /> <edge from-layer="380" from-port="2" to-layer="381" to-port="1" /> <edge from-layer="381" from-port="2" to-layer="382" to-port="2" /> <edge from-layer="381" from-port="2" to-layer="4307" to-port="0" /> <edge from-layer="382" from-port="4" to-layer="384" to-port="0" /> <edge from-layer="383" from-port="0" to-layer="384" to-port="1" /> <edge from-layer="384" from-port="2" to-layer="386" to-port="0" /> <edge from-layer="385" from-port="0" to-layer="386" to-port="1" /> <edge from-layer="386" from-port="2" to-layer="389" to-port="0" /> <edge from-layer="387" from-port="0" to-layer="388" to-port="0" /> <edge from-layer="388" from-port="1" to-layer="389" to-port="1" /> <edge from-layer="389" from-port="2" to-layer="390" to-port="1" /> <edge from-layer="390" from-port="2" to-layer="397" to-port="0" /> <edge from-layer="390" from-port="2" to-layer="405" to-port="0" /> <edge from-layer="390" from-port="2" to-layer="416" to-port="0" /> <edge from-layer="391" from-port="0" to-layer="392" to-port="0" /> <edge from-layer="392" from-port="1" to-layer="406" to-port="0" /> <edge from-layer="393" from-port="0" to-layer="394" to-port="0" /> <edge from-layer="394" from-port="1" to-layer="404" to-port="0" /> <edge from-layer="395" from-port="0" to-layer="396" to-port="0" /> <edge from-layer="396" from-port="1" to-layer="397" to-port="1" /> <edge from-layer="397" from-port="2" to-layer="399" to-port="0" /> <edge from-layer="398" from-port="0" to-layer="399" to-port="1" /> <edge from-layer="399" from-port="2" to-layer="402" to-port="0" /> <edge from-layer="400" from-port="0" to-layer="401" to-port="0" /> <edge from-layer="401" from-port="1" to-layer="402" to-port="1" /> <edge from-layer="402" from-port="2" to-layer="403" to-port="0" /> <edge from-layer="403" from-port="1" to-layer="404" to-port="1" /> <edge from-layer="404" from-port="2" to-layer="405" to-port="1" /> <edge from-layer="405" from-port="2" to-layer="406" to-port="1" /> <edge from-layer="406" from-port="2" to-layer="409" to-port="0" /> <edge from-layer="407" from-port="0" to-layer="408" to-port="0" /> <edge from-layer="408" from-port="1" to-layer="409" to-port="1" /> <edge from-layer="409" from-port="2" to-layer="410" to-port="0" /> <edge from-layer="410" from-port="3" to-layer="411" to-port="0" /> <edge from-layer="410" from-port="4" to-layer="412" to-port="0" /> <edge from-layer="411" from-port="1" to-layer="412" to-port="1" /> <edge from-layer="412" from-port="2" to-layer="415" to-port="0" /> <edge from-layer="413" from-port="0" to-layer="414" to-port="0" /> <edge from-layer="414" from-port="1" to-layer="415" to-port="1" /> <edge from-layer="415" from-port="2" to-layer="416" to-port="1" /> <edge from-layer="416" from-port="2" to-layer="423" to-port="0" /> <edge from-layer="416" from-port="2" to-layer="431" to-port="0" /> <edge from-layer="416" from-port="2" to-layer="520" to-port="0" /> <edge from-layer="417" from-port="0" to-layer="418" to-port="0" /> <edge from-layer="418" from-port="1" to-layer="432" to-port="0" /> <edge from-layer="419" from-port="0" to-layer="420" to-port="0" /> <edge from-layer="420" from-port="1" to-layer="430" to-port="0" /> <edge from-layer="421" from-port="0" to-layer="422" to-port="0" /> <edge from-layer="422" from-port="1" to-layer="423" to-port="1" /> <edge from-layer="423" from-port="2" to-layer="425" to-port="0" /> <edge from-layer="424" from-port="0" to-layer="425" to-port="1" /> <edge from-layer="425" from-port="2" to-layer="428" to-port="0" /> <edge from-layer="426" from-port="0" to-layer="427" to-port="0" /> <edge from-layer="427" from-port="1" to-layer="428" to-port="1" /> <edge from-layer="428" from-port="2" to-layer="429" to-port="0" /> <edge from-layer="429" from-port="1" to-layer="430" to-port="1" /> <edge from-layer="430" from-port="2" to-layer="431" to-port="1" /> <edge from-layer="431" from-port="2" to-layer="432" to-port="1" /> <edge from-layer="432" from-port="2" to-layer="435" to-port="0" /> <edge from-layer="433" from-port="0" to-layer="434" to-port="0" /> <edge from-layer="434" from-port="1" to-layer="435" to-port="1" /> <edge from-layer="435" from-port="2" to-layer="506" to-port="0" /> <edge from-layer="435" from-port="2" to-layer="439" to-port="0" /> <edge from-layer="435" from-port="2" to-layer="472" to-port="0" /> <edge from-layer="436" from-port="0" to-layer="439" to-port="1" /> <edge from-layer="437" from-port="0" to-layer="439" to-port="2" /> <edge from-layer="438" from-port="0" to-layer="439" to-port="3" /> <edge from-layer="439" from-port="5" to-layer="441" to-port="0" /> <edge from-layer="440" from-port="0" to-layer="441" to-port="1" /> <edge from-layer="441" from-port="2" to-layer="443" to-port="0" /> <edge from-layer="442" from-port="0" to-layer="443" to-port="1" /> <edge from-layer="443" from-port="2" to-layer="448" to-port="0" /> <edge from-layer="443" from-port="2" to-layer="444" to-port="0" /> <edge from-layer="443" from-port="2" to-layer="455" to-port="0" /> <edge from-layer="444" from-port="2" to-layer="458" to-port="0" /> <edge from-layer="445" from-port="0" to-layer="448" to-port="1" /> <edge from-layer="446" from-port="0" to-layer="448" to-port="2" /> <edge from-layer="447" from-port="0" to-layer="448" to-port="3" /> <edge from-layer="448" from-port="5" to-layer="451" to-port="0" /> <edge from-layer="449" from-port="0" to-layer="450" to-port="0" /> <edge from-layer="450" from-port="1" to-layer="451" to-port="1" /> <edge from-layer="451" from-port="2" to-layer="456" to-port="0" /> <edge from-layer="452" from-port="0" to-layer="455" to-port="1" /> <edge from-layer="453" from-port="0" to-layer="455" to-port="2" /> <edge from-layer="454" from-port="0" to-layer="455" to-port="3" /> <edge from-layer="455" from-port="5" to-layer="456" to-port="1" /> <edge from-layer="456" from-port="2" to-layer="457" to-port="0" /> <edge from-layer="457" from-port="2" to-layer="458" to-port="1" /> <edge from-layer="458" from-port="2" to-layer="512" to-port="0" /> <edge from-layer="459" from-port="0" to-layer="460" to-port="0" /> <edge from-layer="460" from-port="1" to-layer="465" to-port="0" /> <edge from-layer="461" from-port="0" to-layer="464" to-port="1" /> <edge from-layer="462" from-port="0" to-layer="464" to-port="2" /> <edge from-layer="463" from-port="0" to-layer="464" to-port="3" /> <edge from-layer="464" from-port="4" to-layer="465" to-port="1" /> <edge from-layer="465" from-port="2" to-layer="466" to-port="0" /> <edge from-layer="466" from-port="1" to-layer="468" to-port="0" /> <edge from-layer="467" from-port="0" to-layer="468" to-port="2" /> <edge from-layer="468" from-port="3" to-layer="492" to-port="0" /> <edge from-layer="469" from-port="0" to-layer="472" to-port="1" /> <edge from-layer="470" from-port="0" to-layer="472" to-port="2" /> <edge from-layer="471" from-port="0" to-layer="472" to-port="3" /> <edge from-layer="472" from-port="5" to-layer="474" to-port="0" /> <edge from-layer="473" from-port="0" to-layer="474" to-port="1" /> <edge from-layer="474" from-port="2" to-layer="476" to-port="0" /> <edge from-layer="475" from-port="0" to-layer="476" to-port="1" /> <edge from-layer="476" from-port="2" to-layer="477" to-port="0" /> <edge from-layer="476" from-port="2" to-layer="481" to-port="0" /> <edge from-layer="476" from-port="2" to-layer="488" to-port="0" /> <edge from-layer="477" from-port="2" to-layer="491" to-port="0" /> <edge from-layer="478" from-port="0" to-layer="481" to-port="1" /> <edge from-layer="479" from-port="0" to-layer="481" to-port="2" /> <edge from-layer="480" from-port="0" to-layer="481" to-port="3" /> <edge from-layer="481" from-port="5" to-layer="484" to-port="0" /> <edge from-layer="482" from-port="0" to-layer="483" to-port="0" /> <edge from-layer="483" from-port="1" to-layer="484" to-port="1" /> <edge from-layer="484" from-port="2" to-layer="489" to-port="0" /> <edge from-layer="485" from-port="0" to-layer="488" to-port="1" /> <edge from-layer="486" from-port="0" to-layer="488" to-port="2" /> <edge from-layer="487" from-port="0" to-layer="488" to-port="3" /> <edge from-layer="488" from-port="5" to-layer="489" to-port="1" /> <edge from-layer="489" from-port="2" to-layer="490" to-port="0" /> <edge from-layer="490" from-port="2" to-layer="491" to-port="1" /> <edge from-layer="491" from-port="2" to-layer="492" to-port="1" /> <edge from-layer="492" from-port="2" to-layer="4286" to-port="0" /> <edge from-layer="492" from-port="2" to-layer="512" to-port="1" /> <edge from-layer="493" from-port="0" to-layer="494" to-port="0" /> <edge from-layer="494" from-port="1" to-layer="499" to-port="0" /> <edge from-layer="495" from-port="0" to-layer="498" to-port="1" /> <edge from-layer="496" from-port="0" to-layer="498" to-port="2" /> <edge from-layer="497" from-port="0" to-layer="498" to-port="3" /> <edge from-layer="498" from-port="4" to-layer="499" to-port="1" /> <edge from-layer="499" from-port="2" to-layer="500" to-port="0" /> <edge from-layer="500" from-port="1" to-layer="502" to-port="0" /> <edge from-layer="501" from-port="0" to-layer="502" to-port="2" /> <edge from-layer="502" from-port="3" to-layer="511" to-port="0" /> <edge from-layer="503" from-port="0" to-layer="506" to-port="1" /> <edge from-layer="504" from-port="0" to-layer="506" to-port="2" /> <edge from-layer="505" from-port="0" to-layer="506" to-port="3" /> <edge from-layer="506" from-port="5" to-layer="508" to-port="0" /> <edge from-layer="507" from-port="0" to-layer="508" to-port="1" /> <edge from-layer="508" from-port="2" to-layer="510" to-port="0" /> <edge from-layer="509" from-port="0" to-layer="510" to-port="1" /> <edge from-layer="510" from-port="2" to-layer="511" to-port="1" /> <edge from-layer="511" from-port="2" to-layer="4285" to-port="0" /> <edge from-layer="511" from-port="2" to-layer="512" to-port="2" /> <edge from-layer="512" from-port="4" to-layer="514" to-port="0" /> <edge from-layer="513" from-port="0" to-layer="514" to-port="1" /> <edge from-layer="514" from-port="2" to-layer="516" to-port="0" /> <edge from-layer="515" from-port="0" to-layer="516" to-port="1" /> <edge from-layer="516" from-port="2" to-layer="519" to-port="0" /> <edge from-layer="517" from-port="0" to-layer="518" to-port="0" /> <edge from-layer="518" from-port="1" to-layer="519" to-port="1" /> <edge from-layer="519" from-port="2" to-layer="520" to-port="1" /> <edge from-layer="520" from-port="2" to-layer="535" to-port="0" /> <edge from-layer="520" from-port="2" to-layer="546" to-port="0" /> <edge from-layer="520" from-port="2" to-layer="527" to-port="0" /> <edge from-layer="521" from-port="0" to-layer="522" to-port="0" /> <edge from-layer="522" from-port="1" to-layer="536" to-port="0" /> <edge from-layer="523" from-port="0" to-layer="524" to-port="0" /> <edge from-layer="524" from-port="1" to-layer="534" to-port="0" /> <edge from-layer="525" from-port="0" to-layer="526" to-port="0" /> <edge from-layer="526" from-port="1" to-layer="527" to-port="1" /> <edge from-layer="527" from-port="2" to-layer="529" to-port="0" /> <edge from-layer="528" from-port="0" to-layer="529" to-port="1" /> <edge from-layer="529" from-port="2" to-layer="532" to-port="0" /> <edge from-layer="530" from-port="0" to-layer="531" to-port="0" /> <edge from-layer="531" from-port="1" to-layer="532" to-port="1" /> <edge from-layer="532" from-port="2" to-layer="533" to-port="0" /> <edge from-layer="533" from-port="1" to-layer="534" to-port="1" /> <edge from-layer="534" from-port="2" to-layer="535" to-port="1" /> <edge from-layer="535" from-port="2" to-layer="536" to-port="1" /> <edge from-layer="536" from-port="2" to-layer="539" to-port="0" /> <edge from-layer="537" from-port="0" to-layer="538" to-port="0" /> <edge from-layer="538" from-port="1" to-layer="539" to-port="1" /> <edge from-layer="539" from-port="2" to-layer="540" to-port="0" /> <edge from-layer="540" from-port="4" to-layer="542" to-port="0" /> <edge from-layer="540" from-port="3" to-layer="541" to-port="0" /> <edge from-layer="541" from-port="1" to-layer="542" to-port="1" /> <edge from-layer="542" from-port="2" to-layer="545" to-port="0" /> <edge from-layer="543" from-port="0" to-layer="544" to-port="0" /> <edge from-layer="544" from-port="1" to-layer="545" to-port="1" /> <edge from-layer="545" from-port="2" to-layer="546" to-port="1" /> <edge from-layer="546" from-port="2" to-layer="553" to-port="0" /> <edge from-layer="546" from-port="2" to-layer="561" to-port="0" /> <edge from-layer="546" from-port="2" to-layer="650" to-port="0" /> <edge from-layer="547" from-port="0" to-layer="548" to-port="0" /> <edge from-layer="548" from-port="1" to-layer="562" to-port="0" /> <edge from-layer="549" from-port="0" to-layer="550" to-port="0" /> <edge from-layer="550" from-port="1" to-layer="560" to-port="0" /> <edge from-layer="551" from-port="0" to-layer="552" to-port="0" /> <edge from-layer="552" from-port="1" to-layer="553" to-port="1" /> <edge from-layer="553" from-port="2" to-layer="555" to-port="0" /> <edge from-layer="554" from-port="0" to-layer="555" to-port="1" /> <edge from-layer="555" from-port="2" to-layer="558" to-port="0" /> <edge from-layer="556" from-port="0" to-layer="557" to-port="0" /> <edge from-layer="557" from-port="1" to-layer="558" to-port="1" /> <edge from-layer="558" from-port="2" to-layer="559" to-port="0" /> <edge from-layer="559" from-port="1" to-layer="560" to-port="1" /> <edge from-layer="560" from-port="2" to-layer="561" to-port="1" /> <edge from-layer="561" from-port="2" to-layer="562" to-port="1" /> <edge from-layer="562" from-port="2" to-layer="565" to-port="0" /> <edge from-layer="563" from-port="0" to-layer="564" to-port="0" /> <edge from-layer="564" from-port="1" to-layer="565" to-port="1" /> <edge from-layer="565" from-port="2" to-layer="569" to-port="0" /> <edge from-layer="565" from-port="2" to-layer="602" to-port="0" /> <edge from-layer="565" from-port="2" to-layer="636" to-port="0" /> <edge from-layer="566" from-port="0" to-layer="569" to-port="1" /> <edge from-layer="567" from-port="0" to-layer="569" to-port="2" /> <edge from-layer="568" from-port="0" to-layer="569" to-port="3" /> <edge from-layer="569" from-port="5" to-layer="571" to-port="0" /> <edge from-layer="570" from-port="0" to-layer="571" to-port="1" /> <edge from-layer="571" from-port="2" to-layer="573" to-port="0" /> <edge from-layer="572" from-port="0" to-layer="573" to-port="1" /> <edge from-layer="573" from-port="2" to-layer="578" to-port="0" /> <edge from-layer="573" from-port="2" to-layer="574" to-port="0" /> <edge from-layer="573" from-port="2" to-layer="585" to-port="0" /> <edge from-layer="574" from-port="2" to-layer="588" to-port="0" /> <edge from-layer="575" from-port="0" to-layer="578" to-port="1" /> <edge from-layer="576" from-port="0" to-layer="578" to-port="2" /> <edge from-layer="577" from-port="0" to-layer="578" to-port="3" /> <edge from-layer="578" from-port="5" to-layer="581" to-port="0" /> <edge from-layer="579" from-port="0" to-layer="580" to-port="0" /> <edge from-layer="580" from-port="1" to-layer="581" to-port="1" /> <edge from-layer="581" from-port="2" to-layer="586" to-port="0" /> <edge from-layer="582" from-port="0" to-layer="585" to-port="1" /> <edge from-layer="583" from-port="0" to-layer="585" to-port="2" /> <edge from-layer="584" from-port="0" to-layer="585" to-port="3" /> <edge from-layer="585" from-port="5" to-layer="586" to-port="1" /> <edge from-layer="586" from-port="2" to-layer="587" to-port="0" /> <edge from-layer="587" from-port="2" to-layer="588" to-port="1" /> <edge from-layer="588" from-port="2" to-layer="642" to-port="0" /> <edge from-layer="589" from-port="0" to-layer="590" to-port="0" /> <edge from-layer="590" from-port="1" to-layer="595" to-port="0" /> <edge from-layer="591" from-port="0" to-layer="594" to-port="1" /> <edge from-layer="592" from-port="0" to-layer="594" to-port="2" /> <edge from-layer="593" from-port="0" to-layer="594" to-port="3" /> <edge from-layer="594" from-port="4" to-layer="595" to-port="1" /> <edge from-layer="595" from-port="2" to-layer="596" to-port="0" /> <edge from-layer="596" from-port="1" to-layer="598" to-port="0" /> <edge from-layer="597" from-port="0" to-layer="598" to-port="2" /> <edge from-layer="598" from-port="3" to-layer="622" to-port="0" /> <edge from-layer="599" from-port="0" to-layer="602" to-port="1" /> <edge from-layer="600" from-port="0" to-layer="602" to-port="2" /> <edge from-layer="601" from-port="0" to-layer="602" to-port="3" /> <edge from-layer="602" from-port="5" to-layer="604" to-port="0" /> <edge from-layer="603" from-port="0" to-layer="604" to-port="1" /> <edge from-layer="604" from-port="2" to-layer="606" to-port="0" /> <edge from-layer="605" from-port="0" to-layer="606" to-port="1" /> <edge from-layer="606" from-port="2" to-layer="618" to-port="0" /> <edge from-layer="606" from-port="2" to-layer="611" to-port="0" /> <edge from-layer="606" from-port="2" to-layer="607" to-port="0" /> <edge from-layer="607" from-port="2" to-layer="621" to-port="0" /> <edge from-layer="608" from-port="0" to-layer="611" to-port="1" /> <edge from-layer="609" from-port="0" to-layer="611" to-port="2" /> <edge from-layer="610" from-port="0" to-layer="611" to-port="3" /> <edge from-layer="611" from-port="5" to-layer="614" to-port="0" /> <edge from-layer="612" from-port="0" to-layer="613" to-port="0" /> <edge from-layer="613" from-port="1" to-layer="614" to-port="1" /> <edge from-layer="614" from-port="2" to-layer="619" to-port="0" /> <edge from-layer="615" from-port="0" to-layer="618" to-port="1" /> <edge from-layer="616" from-port="0" to-layer="618" to-port="2" /> <edge from-layer="617" from-port="0" to-layer="618" to-port="3" /> <edge from-layer="618" from-port="5" to-layer="619" to-port="1" /> <edge from-layer="619" from-port="2" to-layer="620" to-port="0" /> <edge from-layer="620" from-port="2" to-layer="621" to-port="1" /> <edge from-layer="621" from-port="2" to-layer="622" to-port="1" /> <edge from-layer="622" from-port="2" to-layer="4264" to-port="0" /> <edge from-layer="622" from-port="2" to-layer="642" to-port="1" /> <edge from-layer="623" from-port="0" to-layer="624" to-port="0" /> <edge from-layer="624" from-port="1" to-layer="629" to-port="0" /> <edge from-layer="625" from-port="0" to-layer="628" to-port="1" /> <edge from-layer="626" from-port="0" to-layer="628" to-port="2" /> <edge from-layer="627" from-port="0" to-layer="628" to-port="3" /> <edge from-layer="628" from-port="4" to-layer="629" to-port="1" /> <edge from-layer="629" from-port="2" to-layer="630" to-port="0" /> <edge from-layer="630" from-port="1" to-layer="632" to-port="0" /> <edge from-layer="631" from-port="0" to-layer="632" to-port="2" /> <edge from-layer="632" from-port="3" to-layer="641" to-port="0" /> <edge from-layer="633" from-port="0" to-layer="636" to-port="1" /> <edge from-layer="634" from-port="0" to-layer="636" to-port="2" /> <edge from-layer="635" from-port="0" to-layer="636" to-port="3" /> <edge from-layer="636" from-port="5" to-layer="638" to-port="0" /> <edge from-layer="637" from-port="0" to-layer="638" to-port="1" /> <edge from-layer="638" from-port="2" to-layer="640" to-port="0" /> <edge from-layer="639" from-port="0" to-layer="640" to-port="1" /> <edge from-layer="640" from-port="2" to-layer="641" to-port="1" /> <edge from-layer="641" from-port="2" to-layer="642" to-port="2" /> <edge from-layer="641" from-port="2" to-layer="4263" to-port="0" /> <edge from-layer="642" from-port="4" to-layer="644" to-port="0" /> <edge from-layer="643" from-port="0" to-layer="644" to-port="1" /> <edge from-layer="644" from-port="2" to-layer="646" to-port="0" /> <edge from-layer="645" from-port="0" to-layer="646" to-port="1" /> <edge from-layer="646" from-port="2" to-layer="649" to-port="0" /> <edge from-layer="647" from-port="0" to-layer="648" to-port="0" /> <edge from-layer="648" from-port="1" to-layer="649" to-port="1" /> <edge from-layer="649" from-port="2" to-layer="650" to-port="1" /> <edge from-layer="650" from-port="2" to-layer="665" to-port="0" /> <edge from-layer="650" from-port="2" to-layer="676" to-port="0" /> <edge from-layer="650" from-port="2" to-layer="657" to-port="0" /> <edge from-layer="651" from-port="0" to-layer="652" to-port="0" /> <edge from-layer="652" from-port="1" to-layer="666" to-port="0" /> <edge from-layer="653" from-port="0" to-layer="654" to-port="0" /> <edge from-layer="654" from-port="1" to-layer="664" to-port="0" /> <edge from-layer="655" from-port="0" to-layer="656" to-port="0" /> <edge from-layer="656" from-port="1" to-layer="657" to-port="1" /> <edge from-layer="657" from-port="2" to-layer="659" to-port="0" /> <edge from-layer="658" from-port="0" to-layer="659" to-port="1" /> <edge from-layer="659" from-port="2" to-layer="662" to-port="0" /> <edge from-layer="660" from-port="0" to-layer="661" to-port="0" /> <edge from-layer="661" from-port="1" to-layer="662" to-port="1" /> <edge from-layer="662" from-port="2" to-layer="663" to-port="0" /> <edge from-layer="663" from-port="1" to-layer="664" to-port="1" /> <edge from-layer="664" from-port="2" to-layer="665" to-port="1" /> <edge from-layer="665" from-port="2" to-layer="666" to-port="1" /> <edge from-layer="666" from-port="2" to-layer="669" to-port="0" /> <edge from-layer="667" from-port="0" to-layer="668" to-port="0" /> <edge from-layer="668" from-port="1" to-layer="669" to-port="1" /> <edge from-layer="669" from-port="2" to-layer="670" to-port="0" /> <edge from-layer="670" from-port="4" to-layer="672" to-port="0" /> <edge from-layer="670" from-port="3" to-layer="671" to-port="0" /> <edge from-layer="671" from-port="1" to-layer="672" to-port="1" /> <edge from-layer="672" from-port="2" to-layer="675" to-port="0" /> <edge from-layer="673" from-port="0" to-layer="674" to-port="0" /> <edge from-layer="674" from-port="1" to-layer="675" to-port="1" /> <edge from-layer="675" from-port="2" to-layer="676" to-port="1" /> <edge from-layer="676" from-port="2" to-layer="780" to-port="0" /> <edge from-layer="676" from-port="2" to-layer="691" to-port="0" /> <edge from-layer="676" from-port="2" to-layer="683" to-port="0" /> <edge from-layer="677" from-port="0" to-layer="678" to-port="0" /> <edge from-layer="678" from-port="1" to-layer="692" to-port="0" /> <edge from-layer="679" from-port="0" to-layer="680" to-port="0" /> <edge from-layer="680" from-port="1" to-layer="690" to-port="0" /> <edge from-layer="681" from-port="0" to-layer="682" to-port="0" /> <edge from-layer="682" from-port="1" to-layer="683" to-port="1" /> <edge from-layer="683" from-port="2" to-layer="685" to-port="0" /> <edge from-layer="684" from-port="0" to-layer="685" to-port="1" /> <edge from-layer="685" from-port="2" to-layer="688" to-port="0" /> <edge from-layer="686" from-port="0" to-layer="687" to-port="0" /> <edge from-layer="687" from-port="1" to-layer="688" to-port="1" /> <edge from-layer="688" from-port="2" to-layer="689" to-port="0" /> <edge from-layer="689" from-port="1" to-layer="690" to-port="1" /> <edge from-layer="690" from-port="2" to-layer="691" to-port="1" /> <edge from-layer="691" from-port="2" to-layer="692" to-port="1" /> <edge from-layer="692" from-port="2" to-layer="695" to-port="0" /> <edge from-layer="693" from-port="0" to-layer="694" to-port="0" /> <edge from-layer="694" from-port="1" to-layer="695" to-port="1" /> <edge from-layer="695" from-port="2" to-layer="766" to-port="0" /> <edge from-layer="695" from-port="2" to-layer="699" to-port="0" /> <edge from-layer="695" from-port="2" to-layer="732" to-port="0" /> <edge from-layer="696" from-port="0" to-layer="699" to-port="1" /> <edge from-layer="697" from-port="0" to-layer="699" to-port="2" /> <edge from-layer="698" from-port="0" to-layer="699" to-port="3" /> <edge from-layer="699" from-port="5" to-layer="701" to-port="0" /> <edge from-layer="700" from-port="0" to-layer="701" to-port="1" /> <edge from-layer="701" from-port="2" to-layer="703" to-port="0" /> <edge from-layer="702" from-port="0" to-layer="703" to-port="1" /> <edge from-layer="703" from-port="2" to-layer="704" to-port="0" /> <edge from-layer="703" from-port="2" to-layer="708" to-port="0" /> <edge from-layer="703" from-port="2" to-layer="715" to-port="0" /> <edge from-layer="704" from-port="2" to-layer="718" to-port="0" /> <edge from-layer="705" from-port="0" to-layer="708" to-port="1" /> <edge from-layer="706" from-port="0" to-layer="708" to-port="2" /> <edge from-layer="707" from-port="0" to-layer="708" to-port="3" /> <edge from-layer="708" from-port="5" to-layer="711" to-port="0" /> <edge from-layer="709" from-port="0" to-layer="710" to-port="0" /> <edge from-layer="710" from-port="1" to-layer="711" to-port="1" /> <edge from-layer="711" from-port="2" to-layer="716" to-port="0" /> <edge from-layer="712" from-port="0" to-layer="715" to-port="1" /> <edge from-layer="713" from-port="0" to-layer="715" to-port="2" /> <edge from-layer="714" from-port="0" to-layer="715" to-port="3" /> <edge from-layer="715" from-port="5" to-layer="716" to-port="1" /> <edge from-layer="716" from-port="2" to-layer="717" to-port="0" /> <edge from-layer="717" from-port="2" to-layer="718" to-port="1" /> <edge from-layer="718" from-port="2" to-layer="772" to-port="0" /> <edge from-layer="719" from-port="0" to-layer="720" to-port="0" /> <edge from-layer="720" from-port="1" to-layer="725" to-port="0" /> <edge from-layer="721" from-port="0" to-layer="724" to-port="1" /> <edge from-layer="722" from-port="0" to-layer="724" to-port="2" /> <edge from-layer="723" from-port="0" to-layer="724" to-port="3" /> <edge from-layer="724" from-port="4" to-layer="725" to-port="1" /> <edge from-layer="725" from-port="2" to-layer="726" to-port="0" /> <edge from-layer="726" from-port="1" to-layer="728" to-port="0" /> <edge from-layer="727" from-port="0" to-layer="728" to-port="2" /> <edge from-layer="728" from-port="3" to-layer="752" to-port="0" /> <edge from-layer="729" from-port="0" to-layer="732" to-port="1" /> <edge from-layer="730" from-port="0" to-layer="732" to-port="2" /> <edge from-layer="731" from-port="0" to-layer="732" to-port="3" /> <edge from-layer="732" from-port="5" to-layer="734" to-port="0" /> <edge from-layer="733" from-port="0" to-layer="734" to-port="1" /> <edge from-layer="734" from-port="2" to-layer="736" to-port="0" /> <edge from-layer="735" from-port="0" to-layer="736" to-port="1" /> <edge from-layer="736" from-port="2" to-layer="737" to-port="0" /> <edge from-layer="736" from-port="2" to-layer="741" to-port="0" /> <edge from-layer="736" from-port="2" to-layer="748" to-port="0" /> <edge from-layer="737" from-port="2" to-layer="751" to-port="0" /> <edge from-layer="738" from-port="0" to-layer="741" to-port="1" /> <edge from-layer="739" from-port="0" to-layer="741" to-port="2" /> <edge from-layer="740" from-port="0" to-layer="741" to-port="3" /> <edge from-layer="741" from-port="5" to-layer="744" to-port="0" /> <edge from-layer="742" from-port="0" to-layer="743" to-port="0" /> <edge from-layer="743" from-port="1" to-layer="744" to-port="1" /> <edge from-layer="744" from-port="2" to-layer="749" to-port="0" /> <edge from-layer="745" from-port="0" to-layer="748" to-port="1" /> <edge from-layer="746" from-port="0" to-layer="748" to-port="2" /> <edge from-layer="747" from-port="0" to-layer="748" to-port="3" /> <edge from-layer="748" from-port="5" to-layer="749" to-port="1" /> <edge from-layer="749" from-port="2" to-layer="750" to-port="0" /> <edge from-layer="750" from-port="2" to-layer="751" to-port="1" /> <edge from-layer="751" from-port="2" to-layer="752" to-port="1" /> <edge from-layer="752" from-port="2" to-layer="1398" to-port="0" /> <edge from-layer="752" from-port="2" to-layer="772" to-port="1" /> <edge from-layer="753" from-port="0" to-layer="754" to-port="0" /> <edge from-layer="754" from-port="1" to-layer="759" to-port="0" /> <edge from-layer="755" from-port="0" to-layer="758" to-port="1" /> <edge from-layer="756" from-port="0" to-layer="758" to-port="2" /> <edge from-layer="757" from-port="0" to-layer="758" to-port="3" /> <edge from-layer="758" from-port="4" to-layer="759" to-port="1" /> <edge from-layer="759" from-port="2" to-layer="760" to-port="0" /> <edge from-layer="760" from-port="1" to-layer="762" to-port="0" /> <edge from-layer="761" from-port="0" to-layer="762" to-port="2" /> <edge from-layer="762" from-port="3" to-layer="771" to-port="0" /> <edge from-layer="763" from-port="0" to-layer="766" to-port="1" /> <edge from-layer="764" from-port="0" to-layer="766" to-port="2" /> <edge from-layer="765" from-port="0" to-layer="766" to-port="3" /> <edge from-layer="766" from-port="5" to-layer="768" to-port="0" /> <edge from-layer="767" from-port="0" to-layer="768" to-port="1" /> <edge from-layer="768" from-port="2" to-layer="770" to-port="0" /> <edge from-layer="769" from-port="0" to-layer="770" to-port="1" /> <edge from-layer="770" from-port="2" to-layer="771" to-port="1" /> <edge from-layer="771" from-port="2" to-layer="772" to-port="2" /> <edge from-layer="771" from-port="2" to-layer="1397" to-port="0" /> <edge from-layer="772" from-port="4" to-layer="774" to-port="0" /> <edge from-layer="773" from-port="0" to-layer="774" to-port="1" /> <edge from-layer="774" from-port="2" to-layer="776" to-port="0" /> <edge from-layer="775" from-port="0" to-layer="776" to-port="1" /> <edge from-layer="776" from-port="2" to-layer="779" to-port="0" /> <edge from-layer="777" from-port="0" to-layer="778" to-port="0" /> <edge from-layer="778" from-port="1" to-layer="779" to-port="1" /> <edge from-layer="779" from-port="2" to-layer="780" to-port="1" /> <edge from-layer="780" from-port="2" to-layer="795" to-port="0" /> <edge from-layer="780" from-port="2" to-layer="806" to-port="0" /> <edge from-layer="780" from-port="2" to-layer="787" to-port="0" /> <edge from-layer="781" from-port="0" to-layer="782" to-port="0" /> <edge from-layer="782" from-port="1" to-layer="796" to-port="0" /> <edge from-layer="783" from-port="0" to-layer="784" to-port="0" /> <edge from-layer="784" from-port="1" to-layer="794" to-port="0" /> <edge from-layer="785" from-port="0" to-layer="786" to-port="0" /> <edge from-layer="786" from-port="1" to-layer="787" to-port="1" /> <edge from-layer="787" from-port="2" to-layer="789" to-port="0" /> <edge from-layer="788" from-port="0" to-layer="789" to-port="1" /> <edge from-layer="789" from-port="2" to-layer="792" to-port="0" /> <edge from-layer="790" from-port="0" to-layer="791" to-port="0" /> <edge from-layer="791" from-port="1" to-layer="792" to-port="1" /> <edge from-layer="792" from-port="2" to-layer="793" to-port="0" /> <edge from-layer="793" from-port="1" to-layer="794" to-port="1" /> <edge from-layer="794" from-port="2" to-layer="795" to-port="1" /> <edge from-layer="795" from-port="2" to-layer="796" to-port="1" /> <edge from-layer="796" from-port="2" to-layer="799" to-port="0" /> <edge from-layer="797" from-port="0" to-layer="798" to-port="0" /> <edge from-layer="798" from-port="1" to-layer="799" to-port="1" /> <edge from-layer="799" from-port="2" to-layer="800" to-port="0" /> <edge from-layer="800" from-port="4" to-layer="802" to-port="0" /> <edge from-layer="800" from-port="3" to-layer="801" to-port="0" /> <edge from-layer="801" from-port="1" to-layer="802" to-port="1" /> <edge from-layer="802" from-port="2" to-layer="805" to-port="0" /> <edge from-layer="803" from-port="0" to-layer="804" to-port="0" /> <edge from-layer="804" from-port="1" to-layer="805" to-port="1" /> <edge from-layer="805" from-port="2" to-layer="806" to-port="1" /> <edge from-layer="806" from-port="2" to-layer="821" to-port="0" /> <edge from-layer="806" from-port="2" to-layer="910" to-port="0" /> <edge from-layer="806" from-port="2" to-layer="813" to-port="0" /> <edge from-layer="807" from-port="0" to-layer="808" to-port="0" /> <edge from-layer="808" from-port="1" to-layer="822" to-port="0" /> <edge from-layer="809" from-port="0" to-layer="810" to-port="0" /> <edge from-layer="810" from-port="1" to-layer="820" to-port="0" /> <edge from-layer="811" from-port="0" to-layer="812" to-port="0" /> <edge from-layer="812" from-port="1" to-layer="813" to-port="1" /> <edge from-layer="813" from-port="2" to-layer="815" to-port="0" /> <edge from-layer="814" from-port="0" to-layer="815" to-port="1" /> <edge from-layer="815" from-port="2" to-layer="818" to-port="0" /> <edge from-layer="816" from-port="0" to-layer="817" to-port="0" /> <edge from-layer="817" from-port="1" to-layer="818" to-port="1" /> <edge from-layer="818" from-port="2" to-layer="819" to-port="0" /> <edge from-layer="819" from-port="1" to-layer="820" to-port="1" /> <edge from-layer="820" from-port="2" to-layer="821" to-port="1" /> <edge from-layer="821" from-port="2" to-layer="822" to-port="1" /> <edge from-layer="822" from-port="2" to-layer="825" to-port="0" /> <edge from-layer="823" from-port="0" to-layer="824" to-port="0" /> <edge from-layer="824" from-port="1" to-layer="825" to-port="1" /> <edge from-layer="825" from-port="2" to-layer="862" to-port="0" /> <edge from-layer="825" from-port="2" to-layer="829" to-port="0" /> <edge from-layer="825" from-port="2" to-layer="896" to-port="0" /> <edge from-layer="826" from-port="0" to-layer="829" to-port="1" /> <edge from-layer="827" from-port="0" to-layer="829" to-port="2" /> <edge from-layer="828" from-port="0" to-layer="829" to-port="3" /> <edge from-layer="829" from-port="5" to-layer="831" to-port="0" /> <edge from-layer="830" from-port="0" to-layer="831" to-port="1" /> <edge from-layer="831" from-port="2" to-layer="833" to-port="0" /> <edge from-layer="832" from-port="0" to-layer="833" to-port="1" /> <edge from-layer="833" from-port="2" to-layer="838" to-port="0" /> <edge from-layer="833" from-port="2" to-layer="845" to-port="0" /> <edge from-layer="833" from-port="2" to-layer="834" to-port="0" /> <edge from-layer="834" from-port="2" to-layer="848" to-port="0" /> <edge from-layer="835" from-port="0" to-layer="838" to-port="1" /> <edge from-layer="836" from-port="0" to-layer="838" to-port="2" /> <edge from-layer="837" from-port="0" to-layer="838" to-port="3" /> <edge from-layer="838" from-port="5" to-layer="841" to-port="0" /> <edge from-layer="839" from-port="0" to-layer="840" to-port="0" /> <edge from-layer="840" from-port="1" to-layer="841" to-port="1" /> <edge from-layer="841" from-port="2" to-layer="846" to-port="0" /> <edge from-layer="842" from-port="0" to-layer="845" to-port="1" /> <edge from-layer="843" from-port="0" to-layer="845" to-port="2" /> <edge from-layer="844" from-port="0" to-layer="845" to-port="3" /> <edge from-layer="845" from-port="5" to-layer="846" to-port="1" /> <edge from-layer="846" from-port="2" to-layer="847" to-port="0" /> <edge from-layer="847" from-port="2" to-layer="848" to-port="1" /> <edge from-layer="848" from-port="2" to-layer="902" to-port="0" /> <edge from-layer="849" from-port="0" to-layer="850" to-port="0" /> <edge from-layer="850" from-port="1" to-layer="855" to-port="0" /> <edge from-layer="851" from-port="0" to-layer="854" to-port="1" /> <edge from-layer="852" from-port="0" to-layer="854" to-port="2" /> <edge from-layer="853" from-port="0" to-layer="854" to-port="3" /> <edge from-layer="854" from-port="4" to-layer="855" to-port="1" /> <edge from-layer="855" from-port="2" to-layer="856" to-port="0" /> <edge from-layer="856" from-port="1" to-layer="858" to-port="0" /> <edge from-layer="857" from-port="0" to-layer="858" to-port="2" /> <edge from-layer="858" from-port="3" to-layer="882" to-port="0" /> <edge from-layer="859" from-port="0" to-layer="862" to-port="1" /> <edge from-layer="860" from-port="0" to-layer="862" to-port="2" /> <edge from-layer="861" from-port="0" to-layer="862" to-port="3" /> <edge from-layer="862" from-port="5" to-layer="864" to-port="0" /> <edge from-layer="863" from-port="0" to-layer="864" to-port="1" /> <edge from-layer="864" from-port="2" to-layer="866" to-port="0" /> <edge from-layer="865" from-port="0" to-layer="866" to-port="1" /> <edge from-layer="866" from-port="2" to-layer="871" to-port="0" /> <edge from-layer="866" from-port="2" to-layer="878" to-port="0" /> <edge from-layer="866" from-port="2" to-layer="867" to-port="0" /> <edge from-layer="867" from-port="2" to-layer="881" to-port="0" /> <edge from-layer="868" from-port="0" to-layer="871" to-port="1" /> <edge from-layer="869" from-port="0" to-layer="871" to-port="2" /> <edge from-layer="870" from-port="0" to-layer="871" to-port="3" /> <edge from-layer="871" from-port="5" to-layer="874" to-port="0" /> <edge from-layer="872" from-port="0" to-layer="873" to-port="0" /> <edge from-layer="873" from-port="1" to-layer="874" to-port="1" /> <edge from-layer="874" from-port="2" to-layer="879" to-port="0" /> <edge from-layer="875" from-port="0" to-layer="878" to-port="1" /> <edge from-layer="876" from-port="0" to-layer="878" to-port="2" /> <edge from-layer="877" from-port="0" to-layer="878" to-port="3" /> <edge from-layer="878" from-port="5" to-layer="879" to-port="1" /> <edge from-layer="879" from-port="2" to-layer="880" to-port="0" /> <edge from-layer="880" from-port="2" to-layer="881" to-port="1" /> <edge from-layer="881" from-port="2" to-layer="882" to-port="1" /> <edge from-layer="882" from-port="2" to-layer="902" to-port="1" /> <edge from-layer="882" from-port="2" to-layer="1396" to-port="0" /> <edge from-layer="883" from-port="0" to-layer="884" to-port="0" /> <edge from-layer="884" from-port="1" to-layer="889" to-port="0" /> <edge from-layer="885" from-port="0" to-layer="888" to-port="1" /> <edge from-layer="886" from-port="0" to-layer="888" to-port="2" /> <edge from-layer="887" from-port="0" to-layer="888" to-port="3" /> <edge from-layer="888" from-port="4" to-layer="889" to-port="1" /> <edge from-layer="889" from-port="2" to-layer="890" to-port="0" /> <edge from-layer="890" from-port="1" to-layer="892" to-port="0" /> <edge from-layer="891" from-port="0" to-layer="892" to-port="2" /> <edge from-layer="892" from-port="3" to-layer="901" to-port="0" /> <edge from-layer="893" from-port="0" to-layer="896" to-port="1" /> <edge from-layer="894" from-port="0" to-layer="896" to-port="2" /> <edge from-layer="895" from-port="0" to-layer="896" to-port="3" /> <edge from-layer="896" from-port="5" to-layer="898" to-port="0" /> <edge from-layer="897" from-port="0" to-layer="898" to-port="1" /> <edge from-layer="898" from-port="2" to-layer="900" to-port="0" /> <edge from-layer="899" from-port="0" to-layer="900" to-port="1" /> <edge from-layer="900" from-port="2" to-layer="901" to-port="1" /> <edge from-layer="901" from-port="2" to-layer="902" to-port="2" /> <edge from-layer="901" from-port="2" to-layer="1395" to-port="0" /> <edge from-layer="902" from-port="4" to-layer="904" to-port="0" /> <edge from-layer="903" from-port="0" to-layer="904" to-port="1" /> <edge from-layer="904" from-port="2" to-layer="906" to-port="0" /> <edge from-layer="905" from-port="0" to-layer="906" to-port="1" /> <edge from-layer="906" from-port="2" to-layer="909" to-port="0" /> <edge from-layer="907" from-port="0" to-layer="908" to-port="0" /> <edge from-layer="908" from-port="1" to-layer="909" to-port="1" /> <edge from-layer="909" from-port="2" to-layer="910" to-port="1" /> <edge from-layer="910" from-port="2" to-layer="936" to-port="0" /> <edge from-layer="910" from-port="2" to-layer="917" to-port="0" /> <edge from-layer="910" from-port="2" to-layer="925" to-port="0" /> <edge from-layer="911" from-port="0" to-layer="912" to-port="0" /> <edge from-layer="912" from-port="1" to-layer="926" to-port="0" /> <edge from-layer="913" from-port="0" to-layer="914" to-port="0" /> <edge from-layer="914" from-port="1" to-layer="924" to-port="0" /> <edge from-layer="915" from-port="0" to-layer="916" to-port="0" /> <edge from-layer="916" from-port="1" to-layer="917" to-port="1" /> <edge from-layer="917" from-port="2" to-layer="919" to-port="0" /> <edge from-layer="918" from-port="0" to-layer="919" to-port="1" /> <edge from-layer="919" from-port="2" to-layer="922" to-port="0" /> <edge from-layer="920" from-port="0" to-layer="921" to-port="0" /> <edge from-layer="921" from-port="1" to-layer="922" to-port="1" /> <edge from-layer="922" from-port="2" to-layer="923" to-port="0" /> <edge from-layer="923" from-port="1" to-layer="924" to-port="1" /> <edge from-layer="924" from-port="2" to-layer="925" to-port="1" /> <edge from-layer="925" from-port="2" to-layer="926" to-port="1" /> <edge from-layer="926" from-port="2" to-layer="929" to-port="0" /> <edge from-layer="927" from-port="0" to-layer="928" to-port="0" /> <edge from-layer="928" from-port="1" to-layer="929" to-port="1" /> <edge from-layer="929" from-port="2" to-layer="930" to-port="0" /> <edge from-layer="930" from-port="4" to-layer="932" to-port="0" /> <edge from-layer="930" from-port="3" to-layer="931" to-port="0" /> <edge from-layer="931" from-port="1" to-layer="932" to-port="1" /> <edge from-layer="932" from-port="2" to-layer="935" to-port="0" /> <edge from-layer="933" from-port="0" to-layer="934" to-port="0" /> <edge from-layer="934" from-port="1" to-layer="935" to-port="1" /> <edge from-layer="935" from-port="2" to-layer="936" to-port="1" /> <edge from-layer="936" from-port="2" to-layer="1040" to-port="0" /> <edge from-layer="936" from-port="2" to-layer="943" to-port="0" /> <edge from-layer="936" from-port="2" to-layer="951" to-port="0" /> <edge from-layer="937" from-port="0" to-layer="938" to-port="0" /> <edge from-layer="938" from-port="1" to-layer="952" to-port="0" /> <edge from-layer="939" from-port="0" to-layer="940" to-port="0" /> <edge from-layer="940" from-port="1" to-layer="950" to-port="0" /> <edge from-layer="941" from-port="0" to-layer="942" to-port="0" /> <edge from-layer="942" from-port="1" to-layer="943" to-port="1" /> <edge from-layer="943" from-port="2" to-layer="945" to-port="0" /> <edge from-layer="944" from-port="0" to-layer="945" to-port="1" /> <edge from-layer="945" from-port="2" to-layer="948" to-port="0" /> <edge from-layer="946" from-port="0" to-layer="947" to-port="0" /> <edge from-layer="947" from-port="1" to-layer="948" to-port="1" /> <edge from-layer="948" from-port="2" to-layer="949" to-port="0" /> <edge from-layer="949" from-port="1" to-layer="950" to-port="1" /> <edge from-layer="950" from-port="2" to-layer="951" to-port="1" /> <edge from-layer="951" from-port="2" to-layer="952" to-port="1" /> <edge from-layer="952" from-port="2" to-layer="955" to-port="0" /> <edge from-layer="953" from-port="0" to-layer="954" to-port="0" /> <edge from-layer="954" from-port="1" to-layer="955" to-port="1" /> <edge from-layer="955" from-port="2" to-layer="959" to-port="0" /> <edge from-layer="955" from-port="2" to-layer="1026" to-port="0" /> <edge from-layer="955" from-port="2" to-layer="992" to-port="0" /> <edge from-layer="956" from-port="0" to-layer="959" to-port="1" /> <edge from-layer="957" from-port="0" to-layer="959" to-port="2" /> <edge from-layer="958" from-port="0" to-layer="959" to-port="3" /> <edge from-layer="959" from-port="5" to-layer="961" to-port="0" /> <edge from-layer="960" from-port="0" to-layer="961" to-port="1" /> <edge from-layer="961" from-port="2" to-layer="963" to-port="0" /> <edge from-layer="962" from-port="0" to-layer="963" to-port="1" /> <edge from-layer="963" from-port="2" to-layer="964" to-port="0" /> <edge from-layer="963" from-port="2" to-layer="975" to-port="0" /> <edge from-layer="963" from-port="2" to-layer="968" to-port="0" /> <edge from-layer="964" from-port="2" to-layer="978" to-port="0" /> <edge from-layer="965" from-port="0" to-layer="968" to-port="1" /> <edge from-layer="966" from-port="0" to-layer="968" to-port="2" /> <edge from-layer="967" from-port="0" to-layer="968" to-port="3" /> <edge from-layer="968" from-port="5" to-layer="971" to-port="0" /> <edge from-layer="969" from-port="0" to-layer="970" to-port="0" /> <edge from-layer="970" from-port="1" to-layer="971" to-port="1" /> <edge from-layer="971" from-port="2" to-layer="976" to-port="0" /> <edge from-layer="972" from-port="0" to-layer="975" to-port="1" /> <edge from-layer="973" from-port="0" to-layer="975" to-port="2" /> <edge from-layer="974" from-port="0" to-layer="975" to-port="3" /> <edge from-layer="975" from-port="5" to-layer="976" to-port="1" /> <edge from-layer="976" from-port="2" to-layer="977" to-port="0" /> <edge from-layer="977" from-port="2" to-layer="978" to-port="1" /> <edge from-layer="978" from-port="2" to-layer="1032" to-port="0" /> <edge from-layer="979" from-port="0" to-layer="980" to-port="0" /> <edge from-layer="980" from-port="1" to-layer="985" to-port="0" /> <edge from-layer="981" from-port="0" to-layer="984" to-port="1" /> <edge from-layer="982" from-port="0" to-layer="984" to-port="2" /> <edge from-layer="983" from-port="0" to-layer="984" to-port="3" /> <edge from-layer="984" from-port="4" to-layer="985" to-port="1" /> <edge from-layer="985" from-port="2" to-layer="986" to-port="0" /> <edge from-layer="986" from-port="1" to-layer="988" to-port="0" /> <edge from-layer="987" from-port="0" to-layer="988" to-port="2" /> <edge from-layer="988" from-port="3" to-layer="1012" to-port="0" /> <edge from-layer="989" from-port="0" to-layer="992" to-port="1" /> <edge from-layer="990" from-port="0" to-layer="992" to-port="2" /> <edge from-layer="991" from-port="0" to-layer="992" to-port="3" /> <edge from-layer="992" from-port="5" to-layer="994" to-port="0" /> <edge from-layer="993" from-port="0" to-layer="994" to-port="1" /> <edge from-layer="994" from-port="2" to-layer="996" to-port="0" /> <edge from-layer="995" from-port="0" to-layer="996" to-port="1" /> <edge from-layer="996" from-port="2" to-layer="997" to-port="0" /> <edge from-layer="996" from-port="2" to-layer="1001" to-port="0" /> <edge from-layer="996" from-port="2" to-layer="1008" to-port="0" /> <edge from-layer="997" from-port="2" to-layer="1011" to-port="0" /> <edge from-layer="998" from-port="0" to-layer="1001" to-port="1" /> <edge from-layer="999" from-port="0" to-layer="1001" to-port="2" /> <edge from-layer="1000" from-port="0" to-layer="1001" to-port="3" /> <edge from-layer="1001" from-port="5" to-layer="1004" to-port="0" /> <edge from-layer="1002" from-port="0" to-layer="1003" to-port="0" /> <edge from-layer="1003" from-port="1" to-layer="1004" to-port="1" /> <edge from-layer="1004" from-port="2" to-layer="1009" to-port="0" /> <edge from-layer="1005" from-port="0" to-layer="1008" to-port="1" /> <edge from-layer="1006" from-port="0" to-layer="1008" to-port="2" /> <edge from-layer="1007" from-port="0" to-layer="1008" to-port="3" /> <edge from-layer="1008" from-port="5" to-layer="1009" to-port="1" /> <edge from-layer="1009" from-port="2" to-layer="1010" to-port="0" /> <edge from-layer="1010" from-port="2" to-layer="1011" to-port="1" /> <edge from-layer="1011" from-port="2" to-layer="1012" to-port="1" /> <edge from-layer="1012" from-port="2" to-layer="1394" to-port="0" /> <edge from-layer="1012" from-port="2" to-layer="1032" to-port="1" /> <edge from-layer="1013" from-port="0" to-layer="1014" to-port="0" /> <edge from-layer="1014" from-port="1" to-layer="1019" to-port="0" /> <edge from-layer="1015" from-port="0" to-layer="1018" to-port="1" /> <edge from-layer="1016" from-port="0" to-layer="1018" to-port="2" /> <edge from-layer="1017" from-port="0" to-layer="1018" to-port="3" /> <edge from-layer="1018" from-port="4" to-layer="1019" to-port="1" /> <edge from-layer="1019" from-port="2" to-layer="1020" to-port="0" /> <edge from-layer="1020" from-port="1" to-layer="1022" to-port="0" /> <edge from-layer="1021" from-port="0" to-layer="1022" to-port="2" /> <edge from-layer="1022" from-port="3" to-layer="1031" to-port="0" /> <edge from-layer="1023" from-port="0" to-layer="1026" to-port="1" /> <edge from-layer="1024" from-port="0" to-layer="1026" to-port="2" /> <edge from-layer="1025" from-port="0" to-layer="1026" to-port="3" /> <edge from-layer="1026" from-port="5" to-layer="1028" to-port="0" /> <edge from-layer="1027" from-port="0" to-layer="1028" to-port="1" /> <edge from-layer="1028" from-port="2" to-layer="1030" to-port="0" /> <edge from-layer="1029" from-port="0" to-layer="1030" to-port="1" /> <edge from-layer="1030" from-port="2" to-layer="1031" to-port="1" /> <edge from-layer="1031" from-port="2" to-layer="1393" to-port="0" /> <edge from-layer="1031" from-port="2" to-layer="1032" to-port="2" /> <edge from-layer="1032" from-port="4" to-layer="1034" to-port="0" /> <edge from-layer="1033" from-port="0" to-layer="1034" to-port="1" /> <edge from-layer="1034" from-port="2" to-layer="1036" to-port="0" /> <edge from-layer="1035" from-port="0" to-layer="1036" to-port="1" /> <edge from-layer="1036" from-port="2" to-layer="1039" to-port="0" /> <edge from-layer="1037" from-port="0" to-layer="1038" to-port="0" /> <edge from-layer="1038" from-port="1" to-layer="1039" to-port="1" /> <edge from-layer="1039" from-port="2" to-layer="1040" to-port="1" /> <edge from-layer="1040" from-port="2" to-layer="1066" to-port="0" /> <edge from-layer="1040" from-port="2" to-layer="1047" to-port="0" /> <edge from-layer="1040" from-port="2" to-layer="1055" to-port="0" /> <edge from-layer="1041" from-port="0" to-layer="1042" to-port="0" /> <edge from-layer="1042" from-port="1" to-layer="1056" to-port="0" /> <edge from-layer="1043" from-port="0" to-layer="1044" to-port="0" /> <edge from-layer="1044" from-port="1" to-layer="1054" to-port="0" /> <edge from-layer="1045" from-port="0" to-layer="1046" to-port="0" /> <edge from-layer="1046" from-port="1" to-layer="1047" to-port="1" /> <edge from-layer="1047" from-port="2" to-layer="1049" to-port="0" /> <edge from-layer="1048" from-port="0" to-layer="1049" to-port="1" /> <edge from-layer="1049" from-port="2" to-layer="1052" to-port="0" /> <edge from-layer="1050" from-port="0" to-layer="1051" to-port="0" /> <edge from-layer="1051" from-port="1" to-layer="1052" to-port="1" /> <edge from-layer="1052" from-port="2" to-layer="1053" to-port="0" /> <edge from-layer="1053" from-port="1" to-layer="1054" to-port="1" /> <edge from-layer="1054" from-port="2" to-layer="1055" to-port="1" /> <edge from-layer="1055" from-port="2" to-layer="1056" to-port="1" /> <edge from-layer="1056" from-port="2" to-layer="1059" to-port="0" /> <edge from-layer="1057" from-port="0" to-layer="1058" to-port="0" /> <edge from-layer="1058" from-port="1" to-layer="1059" to-port="1" /> <edge from-layer="1059" from-port="2" to-layer="1060" to-port="0" /> <edge from-layer="1060" from-port="4" to-layer="1062" to-port="0" /> <edge from-layer="1060" from-port="3" to-layer="1061" to-port="0" /> <edge from-layer="1061" from-port="1" to-layer="1062" to-port="1" /> <edge from-layer="1062" from-port="2" to-layer="1065" to-port="0" /> <edge from-layer="1063" from-port="0" to-layer="1064" to-port="0" /> <edge from-layer="1064" from-port="1" to-layer="1065" to-port="1" /> <edge from-layer="1065" from-port="2" to-layer="1066" to-port="1" /> <edge from-layer="1066" from-port="2" to-layer="1081" to-port="0" /> <edge from-layer="1066" from-port="2" to-layer="1170" to-port="0" /> <edge from-layer="1066" from-port="2" to-layer="1073" to-port="0" /> <edge from-layer="1067" from-port="0" to-layer="1068" to-port="0" /> <edge from-layer="1068" from-port="1" to-layer="1082" to-port="0" /> <edge from-layer="1069" from-port="0" to-layer="1070" to-port="0" /> <edge from-layer="1070" from-port="1" to-layer="1080" to-port="0" /> <edge from-layer="1071" from-port="0" to-layer="1072" to-port="0" /> <edge from-layer="1072" from-port="1" to-layer="1073" to-port="1" /> <edge from-layer="1073" from-port="2" to-layer="1075" to-port="0" /> <edge from-layer="1074" from-port="0" to-layer="1075" to-port="1" /> <edge from-layer="1075" from-port="2" to-layer="1078" to-port="0" /> <edge from-layer="1076" from-port="0" to-layer="1077" to-port="0" /> <edge from-layer="1077" from-port="1" to-layer="1078" to-port="1" /> <edge from-layer="1078" from-port="2" to-layer="1079" to-port="0" /> <edge from-layer="1079" from-port="1" to-layer="1080" to-port="1" /> <edge from-layer="1080" from-port="2" to-layer="1081" to-port="1" /> <edge from-layer="1081" from-port="2" to-layer="1082" to-port="1" /> <edge from-layer="1082" from-port="2" to-layer="1085" to-port="0" /> <edge from-layer="1083" from-port="0" to-layer="1084" to-port="0" /> <edge from-layer="1084" from-port="1" to-layer="1085" to-port="1" /> <edge from-layer="1085" from-port="2" to-layer="1089" to-port="0" /> <edge from-layer="1085" from-port="2" to-layer="1122" to-port="0" /> <edge from-layer="1085" from-port="2" to-layer="1156" to-port="0" /> <edge from-layer="1086" from-port="0" to-layer="1089" to-port="1" /> <edge from-layer="1087" from-port="0" to-layer="1089" to-port="2" /> <edge from-layer="1088" from-port="0" to-layer="1089" to-port="3" /> <edge from-layer="1089" from-port="5" to-layer="1091" to-port="0" /> <edge from-layer="1090" from-port="0" to-layer="1091" to-port="1" /> <edge from-layer="1091" from-port="2" to-layer="1093" to-port="0" /> <edge from-layer="1092" from-port="0" to-layer="1093" to-port="1" /> <edge from-layer="1093" from-port="2" to-layer="1094" to-port="0" /> <edge from-layer="1093" from-port="2" to-layer="1098" to-port="0" /> <edge from-layer="1093" from-port="2" to-layer="1105" to-port="0" /> <edge from-layer="1094" from-port="2" to-layer="1108" to-port="0" /> <edge from-layer="1095" from-port="0" to-layer="1098" to-port="1" /> <edge from-layer="1096" from-port="0" to-layer="1098" to-port="2" /> <edge from-layer="1097" from-port="0" to-layer="1098" to-port="3" /> <edge from-layer="1098" from-port="5" to-layer="1101" to-port="0" /> <edge from-layer="1099" from-port="0" to-layer="1100" to-port="0" /> <edge from-layer="1100" from-port="1" to-layer="1101" to-port="1" /> <edge from-layer="1101" from-port="2" to-layer="1106" to-port="0" /> <edge from-layer="1102" from-port="0" to-layer="1105" to-port="1" /> <edge from-layer="1103" from-port="0" to-layer="1105" to-port="2" /> <edge from-layer="1104" from-port="0" to-layer="1105" to-port="3" /> <edge from-layer="1105" from-port="5" to-layer="1106" to-port="1" /> <edge from-layer="1106" from-port="2" to-layer="1107" to-port="0" /> <edge from-layer="1107" from-port="2" to-layer="1108" to-port="1" /> <edge from-layer="1108" from-port="2" to-layer="1162" to-port="0" /> <edge from-layer="1109" from-port="0" to-layer="1110" to-port="0" /> <edge from-layer="1110" from-port="1" to-layer="1115" to-port="0" /> <edge from-layer="1111" from-port="0" to-layer="1114" to-port="1" /> <edge from-layer="1112" from-port="0" to-layer="1114" to-port="2" /> <edge from-layer="1113" from-port="0" to-layer="1114" to-port="3" /> <edge from-layer="1114" from-port="4" to-layer="1115" to-port="1" /> <edge from-layer="1115" from-port="2" to-layer="1116" to-port="0" /> <edge from-layer="1116" from-port="1" to-layer="1118" to-port="0" /> <edge from-layer="1117" from-port="0" to-layer="1118" to-port="2" /> <edge from-layer="1118" from-port="3" to-layer="1142" to-port="0" /> <edge from-layer="1119" from-port="0" to-layer="1122" to-port="1" /> <edge from-layer="1120" from-port="0" to-layer="1122" to-port="2" /> <edge from-layer="1121" from-port="0" to-layer="1122" to-port="3" /> <edge from-layer="1122" from-port="5" to-layer="1124" to-port="0" /> <edge from-layer="1123" from-port="0" to-layer="1124" to-port="1" /> <edge from-layer="1124" from-port="2" to-layer="1126" to-port="0" /> <edge from-layer="1125" from-port="0" to-layer="1126" to-port="1" /> <edge from-layer="1126" from-port="2" to-layer="1138" to-port="0" /> <edge from-layer="1126" from-port="2" to-layer="1127" to-port="0" /> <edge from-layer="1126" from-port="2" to-layer="1131" to-port="0" /> <edge from-layer="1127" from-port="2" to-layer="1141" to-port="0" /> <edge from-layer="1128" from-port="0" to-layer="1131" to-port="1" /> <edge from-layer="1129" from-port="0" to-layer="1131" to-port="2" /> <edge from-layer="1130" from-port="0" to-layer="1131" to-port="3" /> <edge from-layer="1131" from-port="5" to-layer="1134" to-port="0" /> <edge from-layer="1132" from-port="0" to-layer="1133" to-port="0" /> <edge from-layer="1133" from-port="1" to-layer="1134" to-port="1" /> <edge from-layer="1134" from-port="2" to-layer="1139" to-port="0" /> <edge from-layer="1135" from-port="0" to-layer="1138" to-port="1" /> <edge from-layer="1136" from-port="0" to-layer="1138" to-port="2" /> <edge from-layer="1137" from-port="0" to-layer="1138" to-port="3" /> <edge from-layer="1138" from-port="5" to-layer="1139" to-port="1" /> <edge from-layer="1139" from-port="2" to-layer="1140" to-port="0" /> <edge from-layer="1140" from-port="2" to-layer="1141" to-port="1" /> <edge from-layer="1141" from-port="2" to-layer="1142" to-port="1" /> <edge from-layer="1142" from-port="2" to-layer="1162" to-port="1" /> <edge from-layer="1142" from-port="2" to-layer="1392" to-port="0" /> <edge from-layer="1143" from-port="0" to-layer="1144" to-port="0" /> <edge from-layer="1144" from-port="1" to-layer="1149" to-port="0" /> <edge from-layer="1145" from-port="0" to-layer="1148" to-port="1" /> <edge from-layer="1146" from-port="0" to-layer="1148" to-port="2" /> <edge from-layer="1147" from-port="0" to-layer="1148" to-port="3" /> <edge from-layer="1148" from-port="4" to-layer="1149" to-port="1" /> <edge from-layer="1149" from-port="2" to-layer="1150" to-port="0" /> <edge from-layer="1150" from-port="1" to-layer="1152" to-port="0" /> <edge from-layer="1151" from-port="0" to-layer="1152" to-port="2" /> <edge from-layer="1152" from-port="3" to-layer="1161" to-port="0" /> <edge from-layer="1153" from-port="0" to-layer="1156" to-port="1" /> <edge from-layer="1154" from-port="0" to-layer="1156" to-port="2" /> <edge from-layer="1155" from-port="0" to-layer="1156" to-port="3" /> <edge from-layer="1156" from-port="5" to-layer="1158" to-port="0" /> <edge from-layer="1157" from-port="0" to-layer="1158" to-port="1" /> <edge from-layer="1158" from-port="2" to-layer="1160" to-port="0" /> <edge from-layer="1159" from-port="0" to-layer="1160" to-port="1" /> <edge from-layer="1160" from-port="2" to-layer="1161" to-port="1" /> <edge from-layer="1161" from-port="2" to-layer="1391" to-port="0" /> <edge from-layer="1161" from-port="2" to-layer="1162" to-port="2" /> <edge from-layer="1162" from-port="4" to-layer="1164" to-port="0" /> <edge from-layer="1163" from-port="0" to-layer="1164" to-port="1" /> <edge from-layer="1164" from-port="2" to-layer="1166" to-port="0" /> <edge from-layer="1165" from-port="0" to-layer="1166" to-port="1" /> <edge from-layer="1166" from-port="2" to-layer="1169" to-port="0" /> <edge from-layer="1167" from-port="0" to-layer="1168" to-port="0" /> <edge from-layer="1168" from-port="1" to-layer="1169" to-port="1" /> <edge from-layer="1169" from-port="2" to-layer="1170" to-port="1" /> <edge from-layer="1170" from-port="2" to-layer="1177" to-port="0" /> <edge from-layer="1170" from-port="2" to-layer="1185" to-port="0" /> <edge from-layer="1170" from-port="2" to-layer="1196" to-port="0" /> <edge from-layer="1171" from-port="0" to-layer="1172" to-port="0" /> <edge from-layer="1172" from-port="1" to-layer="1186" to-port="0" /> <edge from-layer="1173" from-port="0" to-layer="1174" to-port="0" /> <edge from-layer="1174" from-port="1" to-layer="1184" to-port="0" /> <edge from-layer="1175" from-port="0" to-layer="1176" to-port="0" /> <edge from-layer="1176" from-port="1" to-layer="1177" to-port="1" /> <edge from-layer="1177" from-port="2" to-layer="1179" to-port="0" /> <edge from-layer="1178" from-port="0" to-layer="1179" to-port="1" /> <edge from-layer="1179" from-port="2" to-layer="1182" to-port="0" /> <edge from-layer="1180" from-port="0" to-layer="1181" to-port="0" /> <edge from-layer="1181" from-port="1" to-layer="1182" to-port="1" /> <edge from-layer="1182" from-port="2" to-layer="1183" to-port="0" /> <edge from-layer="1183" from-port="1" to-layer="1184" to-port="1" /> <edge from-layer="1184" from-port="2" to-layer="1185" to-port="1" /> <edge from-layer="1185" from-port="2" to-layer="1186" to-port="1" /> <edge from-layer="1186" from-port="2" to-layer="1189" to-port="0" /> <edge from-layer="1187" from-port="0" to-layer="1188" to-port="0" /> <edge from-layer="1188" from-port="1" to-layer="1189" to-port="1" /> <edge from-layer="1189" from-port="2" to-layer="1190" to-port="0" /> <edge from-layer="1190" from-port="3" to-layer="1191" to-port="0" /> <edge from-layer="1190" from-port="4" to-layer="1192" to-port="0" /> <edge from-layer="1191" from-port="1" to-layer="1192" to-port="1" /> <edge from-layer="1192" from-port="2" to-layer="1195" to-port="0" /> <edge from-layer="1193" from-port="0" to-layer="1194" to-port="0" /> <edge from-layer="1194" from-port="1" to-layer="1195" to-port="1" /> <edge from-layer="1195" from-port="2" to-layer="1196" to-port="1" /> <edge from-layer="1196" from-port="2" to-layer="1211" to-port="0" /> <edge from-layer="1196" from-port="2" to-layer="1203" to-port="0" /> <edge from-layer="1196" from-port="2" to-layer="1300" to-port="0" /> <edge from-layer="1197" from-port="0" to-layer="1198" to-port="0" /> <edge from-layer="1198" from-port="1" to-layer="1212" to-port="0" /> <edge from-layer="1199" from-port="0" to-layer="1200" to-port="0" /> <edge from-layer="1200" from-port="1" to-layer="1210" to-port="0" /> <edge from-layer="1201" from-port="0" to-layer="1202" to-port="0" /> <edge from-layer="1202" from-port="1" to-layer="1203" to-port="1" /> <edge from-layer="1203" from-port="2" to-layer="1205" to-port="0" /> <edge from-layer="1204" from-port="0" to-layer="1205" to-port="1" /> <edge from-layer="1205" from-port="2" to-layer="1208" to-port="0" /> <edge from-layer="1206" from-port="0" to-layer="1207" to-port="0" /> <edge from-layer="1207" from-port="1" to-layer="1208" to-port="1" /> <edge from-layer="1208" from-port="2" to-layer="1209" to-port="0" /> <edge from-layer="1209" from-port="1" to-layer="1210" to-port="1" /> <edge from-layer="1210" from-port="2" to-layer="1211" to-port="1" /> <edge from-layer="1211" from-port="2" to-layer="1212" to-port="1" /> <edge from-layer="1212" from-port="2" to-layer="1215" to-port="0" /> <edge from-layer="1213" from-port="0" to-layer="1214" to-port="0" /> <edge from-layer="1214" from-port="1" to-layer="1215" to-port="1" /> <edge from-layer="1215" from-port="2" to-layer="1219" to-port="0" /> <edge from-layer="1215" from-port="2" to-layer="1286" to-port="0" /> <edge from-layer="1215" from-port="2" to-layer="1252" to-port="0" /> <edge from-layer="1216" from-port="0" to-layer="1219" to-port="1" /> <edge from-layer="1217" from-port="0" to-layer="1219" to-port="2" /> <edge from-layer="1218" from-port="0" to-layer="1219" to-port="3" /> <edge from-layer="1219" from-port="5" to-layer="1221" to-port="0" /> <edge from-layer="1220" from-port="0" to-layer="1221" to-port="1" /> <edge from-layer="1221" from-port="2" to-layer="1223" to-port="0" /> <edge from-layer="1222" from-port="0" to-layer="1223" to-port="1" /> <edge from-layer="1223" from-port="2" to-layer="1235" to-port="0" /> <edge from-layer="1223" from-port="2" to-layer="1224" to-port="0" /> <edge from-layer="1223" from-port="2" to-layer="1228" to-port="0" /> <edge from-layer="1224" from-port="2" to-layer="1238" to-port="0" /> <edge from-layer="1225" from-port="0" to-layer="1228" to-port="1" /> <edge from-layer="1226" from-port="0" to-layer="1228" to-port="2" /> <edge from-layer="1227" from-port="0" to-layer="1228" to-port="3" /> <edge from-layer="1228" from-port="5" to-layer="1231" to-port="0" /> <edge from-layer="1229" from-port="0" to-layer="1230" to-port="0" /> <edge from-layer="1230" from-port="1" to-layer="1231" to-port="1" /> <edge from-layer="1231" from-port="2" to-layer="1236" to-port="0" /> <edge from-layer="1232" from-port="0" to-layer="1235" to-port="1" /> <edge from-layer="1233" from-port="0" to-layer="1235" to-port="2" /> <edge from-layer="1234" from-port="0" to-layer="1235" to-port="3" /> <edge from-layer="1235" from-port="5" to-layer="1236" to-port="1" /> <edge from-layer="1236" from-port="2" to-layer="1237" to-port="0" /> <edge from-layer="1237" from-port="2" to-layer="1238" to-port="1" /> <edge from-layer="1238" from-port="2" to-layer="1292" to-port="0" /> <edge from-layer="1239" from-port="0" to-layer="1240" to-port="0" /> <edge from-layer="1240" from-port="1" to-layer="1245" to-port="0" /> <edge from-layer="1241" from-port="0" to-layer="1244" to-port="1" /> <edge from-layer="1242" from-port="0" to-layer="1244" to-port="2" /> <edge from-layer="1243" from-port="0" to-layer="1244" to-port="3" /> <edge from-layer="1244" from-port="4" to-layer="1245" to-port="1" /> <edge from-layer="1245" from-port="2" to-layer="1246" to-port="0" /> <edge from-layer="1246" from-port="1" to-layer="1248" to-port="0" /> <edge from-layer="1247" from-port="0" to-layer="1248" to-port="2" /> <edge from-layer="1248" from-port="3" to-layer="1272" to-port="0" /> <edge from-layer="1249" from-port="0" to-layer="1252" to-port="1" /> <edge from-layer="1250" from-port="0" to-layer="1252" to-port="2" /> <edge from-layer="1251" from-port="0" to-layer="1252" to-port="3" /> <edge from-layer="1252" from-port="5" to-layer="1254" to-port="0" /> <edge from-layer="1253" from-port="0" to-layer="1254" to-port="1" /> <edge from-layer="1254" from-port="2" to-layer="1256" to-port="0" /> <edge from-layer="1255" from-port="0" to-layer="1256" to-port="1" /> <edge from-layer="1256" from-port="2" to-layer="1268" to-port="0" /> <edge from-layer="1256" from-port="2" to-layer="1257" to-port="0" /> <edge from-layer="1256" from-port="2" to-layer="1261" to-port="0" /> <edge from-layer="1257" from-port="2" to-layer="1271" to-port="0" /> <edge from-layer="1258" from-port="0" to-layer="1261" to-port="1" /> <edge from-layer="1259" from-port="0" to-layer="1261" to-port="2" /> <edge from-layer="1260" from-port="0" to-layer="1261" to-port="3" /> <edge from-layer="1261" from-port="5" to-layer="1264" to-port="0" /> <edge from-layer="1262" from-port="0" to-layer="1263" to-port="0" /> <edge from-layer="1263" from-port="1" to-layer="1264" to-port="1" /> <edge from-layer="1264" from-port="2" to-layer="1269" to-port="0" /> <edge from-layer="1265" from-port="0" to-layer="1268" to-port="1" /> <edge from-layer="1266" from-port="0" to-layer="1268" to-port="2" /> <edge from-layer="1267" from-port="0" to-layer="1268" to-port="3" /> <edge from-layer="1268" from-port="5" to-layer="1269" to-port="1" /> <edge from-layer="1269" from-port="2" to-layer="1270" to-port="0" /> <edge from-layer="1270" from-port="2" to-layer="1271" to-port="1" /> <edge from-layer="1271" from-port="2" to-layer="1272" to-port="1" /> <edge from-layer="1272" from-port="2" to-layer="1390" to-port="0" /> <edge from-layer="1272" from-port="2" to-layer="1292" to-port="1" /> <edge from-layer="1273" from-port="0" to-layer="1274" to-port="0" /> <edge from-layer="1274" from-port="1" to-layer="1279" to-port="0" /> <edge from-layer="1275" from-port="0" to-layer="1278" to-port="1" /> <edge from-layer="1276" from-port="0" to-layer="1278" to-port="2" /> <edge from-layer="1277" from-port="0" to-layer="1278" to-port="3" /> <edge from-layer="1278" from-port="4" to-layer="1279" to-port="1" /> <edge from-layer="1279" from-port="2" to-layer="1280" to-port="0" /> <edge from-layer="1280" from-port="1" to-layer="1282" to-port="0" /> <edge from-layer="1281" from-port="0" to-layer="1282" to-port="2" /> <edge from-layer="1282" from-port="3" to-layer="1291" to-port="0" /> <edge from-layer="1283" from-port="0" to-layer="1286" to-port="1" /> <edge from-layer="1284" from-port="0" to-layer="1286" to-port="2" /> <edge from-layer="1285" from-port="0" to-layer="1286" to-port="3" /> <edge from-layer="1286" from-port="5" to-layer="1288" to-port="0" /> <edge from-layer="1287" from-port="0" to-layer="1288" to-port="1" /> <edge from-layer="1288" from-port="2" to-layer="1290" to-port="0" /> <edge from-layer="1289" from-port="0" to-layer="1290" to-port="1" /> <edge from-layer="1290" from-port="2" to-layer="1291" to-port="1" /> <edge from-layer="1291" from-port="2" to-layer="1389" to-port="0" /> <edge from-layer="1291" from-port="2" to-layer="1292" to-port="2" /> <edge from-layer="1292" from-port="4" to-layer="1294" to-port="0" /> <edge from-layer="1293" from-port="0" to-layer="1294" to-port="1" /> <edge from-layer="1294" from-port="2" to-layer="1296" to-port="0" /> <edge from-layer="1295" from-port="0" to-layer="1296" to-port="1" /> <edge from-layer="1296" from-port="2" to-layer="1299" to-port="0" /> <edge from-layer="1297" from-port="0" to-layer="1298" to-port="0" /> <edge from-layer="1298" from-port="1" to-layer="1299" to-port="1" /> <edge from-layer="1299" from-port="2" to-layer="1300" to-port="1" /> <edge from-layer="1300" from-port="2" to-layer="1307" to-port="0" /> <edge from-layer="1300" from-port="2" to-layer="1326" to-port="0" /> <edge from-layer="1300" from-port="2" to-layer="1315" to-port="0" /> <edge from-layer="1301" from-port="0" to-layer="1302" to-port="0" /> <edge from-layer="1302" from-port="1" to-layer="1316" to-port="0" /> <edge from-layer="1303" from-port="0" to-layer="1304" to-port="0" /> <edge from-layer="1304" from-port="1" to-layer="1314" to-port="0" /> <edge from-layer="1305" from-port="0" to-layer="1306" to-port="0" /> <edge from-layer="1306" from-port="1" to-layer="1307" to-port="1" /> <edge from-layer="1307" from-port="2" to-layer="1309" to-port="0" /> <edge from-layer="1308" from-port="0" to-layer="1309" to-port="1" /> <edge from-layer="1309" from-port="2" to-layer="1312" to-port="0" /> <edge from-layer="1310" from-port="0" to-layer="1311" to-port="0" /> <edge from-layer="1311" from-port="1" to-layer="1312" to-port="1" /> <edge from-layer="1312" from-port="2" to-layer="1313" to-port="0" /> <edge from-layer="1313" from-port="1" to-layer="1314" to-port="1" /> <edge from-layer="1314" from-port="2" to-layer="1315" to-port="1" /> <edge from-layer="1315" from-port="2" to-layer="1316" to-port="1" /> <edge from-layer="1316" from-port="2" to-layer="1319" to-port="0" /> <edge from-layer="1317" from-port="0" to-layer="1318" to-port="0" /> <edge from-layer="1318" from-port="1" to-layer="1319" to-port="1" /> <edge from-layer="1319" from-port="2" to-layer="1320" to-port="0" /> <edge from-layer="1320" from-port="3" to-layer="1321" to-port="0" /> <edge from-layer="1320" from-port="4" to-layer="1322" to-port="0" /> <edge from-layer="1321" from-port="1" to-layer="1322" to-port="1" /> <edge from-layer="1322" from-port="2" to-layer="1325" to-port="0" /> <edge from-layer="1323" from-port="0" to-layer="1324" to-port="0" /> <edge from-layer="1324" from-port="1" to-layer="1325" to-port="1" /> <edge from-layer="1325" from-port="2" to-layer="1326" to-port="1" /> <edge from-layer="1326" from-port="2" to-layer="1339" to-port="0" /> <edge from-layer="1326" from-port="2" to-layer="1442" to-port="0" /> <edge from-layer="1326" from-port="2" to-layer="1331" to-port="0" /> <edge from-layer="1327" from-port="0" to-layer="1328" to-port="0" /> <edge from-layer="1328" from-port="1" to-layer="1338" to-port="0" /> <edge from-layer="1329" from-port="0" to-layer="1330" to-port="0" /> <edge from-layer="1330" from-port="1" to-layer="1331" to-port="1" /> <edge from-layer="1331" from-port="2" to-layer="1333" to-port="0" /> <edge from-layer="1332" from-port="0" to-layer="1333" to-port="1" /> <edge from-layer="1333" from-port="2" to-layer="1336" to-port="0" /> <edge from-layer="1334" from-port="0" to-layer="1335" to-port="0" /> <edge from-layer="1335" from-port="1" to-layer="1336" to-port="1" /> <edge from-layer="1336" from-port="2" to-layer="1337" to-port="0" /> <edge from-layer="1337" from-port="1" to-layer="1338" to-port="1" /> <edge from-layer="1338" from-port="2" to-layer="1339" to-port="1" /> <edge from-layer="1339" from-port="2" to-layer="1340" to-port="1" /> <edge from-layer="1340" from-port="2" to-layer="1343" to-port="0" /> <edge from-layer="1341" from-port="0" to-layer="1342" to-port="0" /> <edge from-layer="1342" from-port="1" to-layer="1343" to-port="1" /> <edge from-layer="1343" from-port="2" to-layer="1367" to-port="0" /> <edge from-layer="1343" from-port="2" to-layer="1414" to-port="0" /> <edge from-layer="1343" from-port="2" to-layer="1347" to-port="0" /> <edge from-layer="1344" from-port="0" to-layer="1347" to-port="1" /> <edge from-layer="1345" from-port="0" to-layer="1347" to-port="2" /> <edge from-layer="1346" from-port="0" to-layer="1347" to-port="3" /> <edge from-layer="1347" from-port="5" to-layer="1349" to-port="0" /> <edge from-layer="1348" from-port="0" to-layer="1349" to-port="1" /> <edge from-layer="1349" from-port="2" to-layer="1351" to-port="0" /> <edge from-layer="1350" from-port="0" to-layer="1351" to-port="1" /> <edge from-layer="1351" from-port="2" to-layer="1352" to-port="1" /> <edge from-layer="1352" from-port="2" to-layer="1434" to-port="2" /> <edge from-layer="1352" from-port="2" to-layer="1353" to-port="0" /> <edge from-layer="1354" from-port="0" to-layer="1355" to-port="0" /> <edge from-layer="1355" from-port="1" to-layer="1360" to-port="0" /> <edge from-layer="1356" from-port="0" to-layer="1359" to-port="1" /> <edge from-layer="1357" from-port="0" to-layer="1359" to-port="2" /> <edge from-layer="1358" from-port="0" to-layer="1359" to-port="3" /> <edge from-layer="1359" from-port="4" to-layer="1360" to-port="1" /> <edge from-layer="1360" from-port="2" to-layer="1361" to-port="0" /> <edge from-layer="1361" from-port="1" to-layer="1363" to-port="0" /> <edge from-layer="1362" from-port="0" to-layer="1363" to-port="2" /> <edge from-layer="1363" from-port="3" to-layer="1387" to-port="0" /> <edge from-layer="1364" from-port="0" to-layer="1367" to-port="1" /> <edge from-layer="1365" from-port="0" to-layer="1367" to-port="2" /> <edge from-layer="1366" from-port="0" to-layer="1367" to-port="3" /> <edge from-layer="1367" from-port="5" to-layer="1369" to-port="0" /> <edge from-layer="1368" from-port="0" to-layer="1369" to-port="1" /> <edge from-layer="1369" from-port="2" to-layer="1371" to-port="0" /> <edge from-layer="1370" from-port="0" to-layer="1371" to-port="1" /> <edge from-layer="1371" from-port="2" to-layer="1376" to-port="0" /> <edge from-layer="1371" from-port="2" to-layer="1372" to-port="0" /> <edge from-layer="1371" from-port="2" to-layer="1383" to-port="0" /> <edge from-layer="1372" from-port="2" to-layer="1386" to-port="0" /> <edge from-layer="1373" from-port="0" to-layer="1376" to-port="1" /> <edge from-layer="1374" from-port="0" to-layer="1376" to-port="2" /> <edge from-layer="1375" from-port="0" to-layer="1376" to-port="3" /> <edge from-layer="1376" from-port="5" to-layer="1379" to-port="0" /> <edge from-layer="1377" from-port="0" to-layer="1378" to-port="0" /> <edge from-layer="1378" from-port="1" to-layer="1379" to-port="1" /> <edge from-layer="1379" from-port="2" to-layer="1384" to-port="0" /> <edge from-layer="1380" from-port="0" to-layer="1383" to-port="1" /> <edge from-layer="1381" from-port="0" to-layer="1383" to-port="2" /> <edge from-layer="1382" from-port="0" to-layer="1383" to-port="3" /> <edge from-layer="1383" from-port="5" to-layer="1384" to-port="1" /> <edge from-layer="1384" from-port="2" to-layer="1385" to-port="0" /> <edge from-layer="1385" from-port="2" to-layer="1386" to-port="1" /> <edge from-layer="1386" from-port="2" to-layer="1387" to-port="1" /> <edge from-layer="1387" from-port="2" to-layer="1434" to-port="1" /> <edge from-layer="1387" from-port="2" to-layer="1388" to-port="0" /> <edge from-layer="1399" from-port="0" to-layer="1400" to-port="0" /> <edge from-layer="1400" from-port="1" to-layer="1405" to-port="0" /> <edge from-layer="1401" from-port="0" to-layer="1404" to-port="1" /> <edge from-layer="1402" from-port="0" to-layer="1404" to-port="2" /> <edge from-layer="1403" from-port="0" to-layer="1404" to-port="3" /> <edge from-layer="1404" from-port="4" to-layer="1405" to-port="1" /> <edge from-layer="1405" from-port="2" to-layer="1406" to-port="0" /> <edge from-layer="1406" from-port="1" to-layer="1408" to-port="0" /> <edge from-layer="1407" from-port="0" to-layer="1408" to-port="2" /> <edge from-layer="1408" from-port="3" to-layer="4224" to-port="0" /> <edge from-layer="1409" from-port="0" to-layer="1410" to-port="0" /> <edge from-layer="1410" from-port="1" to-layer="4212" to-port="0" /> <edge from-layer="1411" from-port="0" to-layer="1414" to-port="1" /> <edge from-layer="1412" from-port="0" to-layer="1414" to-port="2" /> <edge from-layer="1413" from-port="0" to-layer="1414" to-port="3" /> <edge from-layer="1414" from-port="5" to-layer="1416" to-port="0" /> <edge from-layer="1415" from-port="0" to-layer="1416" to-port="1" /> <edge from-layer="1416" from-port="2" to-layer="1418" to-port="0" /> <edge from-layer="1417" from-port="0" to-layer="1418" to-port="1" /> <edge from-layer="1418" from-port="2" to-layer="1430" to-port="0" /> <edge from-layer="1418" from-port="2" to-layer="1419" to-port="0" /> <edge from-layer="1418" from-port="2" to-layer="1423" to-port="0" /> <edge from-layer="1419" from-port="2" to-layer="1433" to-port="0" /> <edge from-layer="1420" from-port="0" to-layer="1423" to-port="1" /> <edge from-layer="1421" from-port="0" to-layer="1423" to-port="2" /> <edge from-layer="1422" from-port="0" to-layer="1423" to-port="3" /> <edge from-layer="1423" from-port="5" to-layer="1426" to-port="0" /> <edge from-layer="1424" from-port="0" to-layer="1425" to-port="0" /> <edge from-layer="1425" from-port="1" to-layer="1426" to-port="1" /> <edge from-layer="1426" from-port="2" to-layer="1431" to-port="0" /> <edge from-layer="1427" from-port="0" to-layer="1430" to-port="1" /> <edge from-layer="1428" from-port="0" to-layer="1430" to-port="2" /> <edge from-layer="1429" from-port="0" to-layer="1430" to-port="3" /> <edge from-layer="1430" from-port="5" to-layer="1431" to-port="1" /> <edge from-layer="1431" from-port="2" to-layer="1432" to-port="0" /> <edge from-layer="1432" from-port="2" to-layer="1433" to-port="1" /> <edge from-layer="1433" from-port="2" to-layer="1434" to-port="0" /> <edge from-layer="1434" from-port="4" to-layer="1436" to-port="0" /> <edge from-layer="1435" from-port="0" to-layer="1436" to-port="1" /> <edge from-layer="1436" from-port="2" to-layer="1438" to-port="0" /> <edge from-layer="1437" from-port="0" to-layer="1438" to-port="1" /> <edge from-layer="1438" from-port="2" to-layer="1441" to-port="0" /> <edge from-layer="1439" from-port="0" to-layer="1440" to-port="0" /> <edge from-layer="1440" from-port="1" to-layer="1441" to-port="1" /> <edge from-layer="1441" from-port="2" to-layer="1442" to-port="1" /> <edge from-layer="1442" from-port="2" to-layer="1449" to-port="0" /> <edge from-layer="1442" from-port="2" to-layer="1468" to-port="0" /> <edge from-layer="1442" from-port="2" to-layer="1457" to-port="0" /> <edge from-layer="1443" from-port="0" to-layer="1444" to-port="0" /> <edge from-layer="1444" from-port="1" to-layer="1458" to-port="0" /> <edge from-layer="1445" from-port="0" to-layer="1446" to-port="0" /> <edge from-layer="1446" from-port="1" to-layer="1456" to-port="0" /> <edge from-layer="1447" from-port="0" to-layer="1448" to-port="0" /> <edge from-layer="1448" from-port="1" to-layer="1449" to-port="1" /> <edge from-layer="1449" from-port="2" to-layer="1451" to-port="0" /> <edge from-layer="1450" from-port="0" to-layer="1451" to-port="1" /> <edge from-layer="1451" from-port="2" to-layer="1454" to-port="0" /> <edge from-layer="1452" from-port="0" to-layer="1453" to-port="0" /> <edge from-layer="1453" from-port="1" to-layer="1454" to-port="1" /> <edge from-layer="1454" from-port="2" to-layer="1455" to-port="0" /> <edge from-layer="1455" from-port="1" to-layer="1456" to-port="1" /> <edge from-layer="1456" from-port="2" to-layer="1457" to-port="1" /> <edge from-layer="1457" from-port="2" to-layer="1458" to-port="1" /> <edge from-layer="1458" from-port="2" to-layer="1461" to-port="0" /> <edge from-layer="1459" from-port="0" to-layer="1460" to-port="0" /> <edge from-layer="1460" from-port="1" to-layer="1461" to-port="1" /> <edge from-layer="1461" from-port="2" to-layer="1462" to-port="0" /> <edge from-layer="1462" from-port="3" to-layer="1463" to-port="0" /> <edge from-layer="1462" from-port="4" to-layer="1464" to-port="0" /> <edge from-layer="1463" from-port="1" to-layer="1464" to-port="1" /> <edge from-layer="1464" from-port="2" to-layer="1467" to-port="0" /> <edge from-layer="1465" from-port="0" to-layer="1466" to-port="0" /> <edge from-layer="1466" from-port="1" to-layer="1467" to-port="1" /> <edge from-layer="1467" from-port="2" to-layer="1468" to-port="1" /> <edge from-layer="1468" from-port="2" to-layer="1475" to-port="0" /> <edge from-layer="1468" from-port="2" to-layer="1483" to-port="0" /> <edge from-layer="1468" from-port="2" to-layer="1572" to-port="0" /> <edge from-layer="1469" from-port="0" to-layer="1470" to-port="0" /> <edge from-layer="1470" from-port="1" to-layer="1484" to-port="0" /> <edge from-layer="1471" from-port="0" to-layer="1472" to-port="0" /> <edge from-layer="1472" from-port="1" to-layer="1482" to-port="0" /> <edge from-layer="1473" from-port="0" to-layer="1474" to-port="0" /> <edge from-layer="1474" from-port="1" to-layer="1475" to-port="1" /> <edge from-layer="1475" from-port="2" to-layer="1477" to-port="0" /> <edge from-layer="1476" from-port="0" to-layer="1477" to-port="1" /> <edge from-layer="1477" from-port="2" to-layer="1480" to-port="0" /> <edge from-layer="1478" from-port="0" to-layer="1479" to-port="0" /> <edge from-layer="1479" from-port="1" to-layer="1480" to-port="1" /> <edge from-layer="1480" from-port="2" to-layer="1481" to-port="0" /> <edge from-layer="1481" from-port="1" to-layer="1482" to-port="1" /> <edge from-layer="1482" from-port="2" to-layer="1483" to-port="1" /> <edge from-layer="1483" from-port="2" to-layer="1484" to-port="1" /> <edge from-layer="1484" from-port="2" to-layer="1487" to-port="0" /> <edge from-layer="1485" from-port="0" to-layer="1486" to-port="0" /> <edge from-layer="1486" from-port="1" to-layer="1487" to-port="1" /> <edge from-layer="1487" from-port="2" to-layer="1558" to-port="0" /> <edge from-layer="1487" from-port="2" to-layer="1524" to-port="0" /> <edge from-layer="1487" from-port="2" to-layer="1491" to-port="0" /> <edge from-layer="1488" from-port="0" to-layer="1491" to-port="1" /> <edge from-layer="1489" from-port="0" to-layer="1491" to-port="2" /> <edge from-layer="1490" from-port="0" to-layer="1491" to-port="3" /> <edge from-layer="1491" from-port="5" to-layer="1493" to-port="0" /> <edge from-layer="1492" from-port="0" to-layer="1493" to-port="1" /> <edge from-layer="1493" from-port="2" to-layer="1495" to-port="0" /> <edge from-layer="1494" from-port="0" to-layer="1495" to-port="1" /> <edge from-layer="1495" from-port="2" to-layer="1507" to-port="0" /> <edge from-layer="1495" from-port="2" to-layer="1500" to-port="0" /> <edge from-layer="1495" from-port="2" to-layer="1496" to-port="0" /> <edge from-layer="1496" from-port="2" to-layer="1510" to-port="0" /> <edge from-layer="1497" from-port="0" to-layer="1500" to-port="1" /> <edge from-layer="1498" from-port="0" to-layer="1500" to-port="2" /> <edge from-layer="1499" from-port="0" to-layer="1500" to-port="3" /> <edge from-layer="1500" from-port="5" to-layer="1503" to-port="0" /> <edge from-layer="1501" from-port="0" to-layer="1502" to-port="0" /> <edge from-layer="1502" from-port="1" to-layer="1503" to-port="1" /> <edge from-layer="1503" from-port="2" to-layer="1508" to-port="0" /> <edge from-layer="1504" from-port="0" to-layer="1507" to-port="1" /> <edge from-layer="1505" from-port="0" to-layer="1507" to-port="2" /> <edge from-layer="1506" from-port="0" to-layer="1507" to-port="3" /> <edge from-layer="1507" from-port="5" to-layer="1508" to-port="1" /> <edge from-layer="1508" from-port="2" to-layer="1509" to-port="0" /> <edge from-layer="1509" from-port="2" to-layer="1510" to-port="1" /> <edge from-layer="1510" from-port="2" to-layer="1564" to-port="0" /> <edge from-layer="1511" from-port="0" to-layer="1512" to-port="0" /> <edge from-layer="1512" from-port="1" to-layer="1517" to-port="0" /> <edge from-layer="1513" from-port="0" to-layer="1516" to-port="1" /> <edge from-layer="1514" from-port="0" to-layer="1516" to-port="2" /> <edge from-layer="1515" from-port="0" to-layer="1516" to-port="3" /> <edge from-layer="1516" from-port="4" to-layer="1517" to-port="1" /> <edge from-layer="1517" from-port="2" to-layer="1518" to-port="0" /> <edge from-layer="1518" from-port="1" to-layer="1520" to-port="0" /> <edge from-layer="1519" from-port="0" to-layer="1520" to-port="2" /> <edge from-layer="1520" from-port="3" to-layer="1544" to-port="0" /> <edge from-layer="1521" from-port="0" to-layer="1524" to-port="1" /> <edge from-layer="1522" from-port="0" to-layer="1524" to-port="2" /> <edge from-layer="1523" from-port="0" to-layer="1524" to-port="3" /> <edge from-layer="1524" from-port="5" to-layer="1526" to-port="0" /> <edge from-layer="1525" from-port="0" to-layer="1526" to-port="1" /> <edge from-layer="1526" from-port="2" to-layer="1528" to-port="0" /> <edge from-layer="1527" from-port="0" to-layer="1528" to-port="1" /> <edge from-layer="1528" from-port="2" to-layer="1540" to-port="0" /> <edge from-layer="1528" from-port="2" to-layer="1533" to-port="0" /> <edge from-layer="1528" from-port="2" to-layer="1529" to-port="0" /> <edge from-layer="1529" from-port="2" to-layer="1543" to-port="0" /> <edge from-layer="1530" from-port="0" to-layer="1533" to-port="1" /> <edge from-layer="1531" from-port="0" to-layer="1533" to-port="2" /> <edge from-layer="1532" from-port="0" to-layer="1533" to-port="3" /> <edge from-layer="1533" from-port="5" to-layer="1536" to-port="0" /> <edge from-layer="1534" from-port="0" to-layer="1535" to-port="0" /> <edge from-layer="1535" from-port="1" to-layer="1536" to-port="1" /> <edge from-layer="1536" from-port="2" to-layer="1541" to-port="0" /> <edge from-layer="1537" from-port="0" to-layer="1540" to-port="1" /> <edge from-layer="1538" from-port="0" to-layer="1540" to-port="2" /> <edge from-layer="1539" from-port="0" to-layer="1540" to-port="3" /> <edge from-layer="1540" from-port="5" to-layer="1541" to-port="1" /> <edge from-layer="1541" from-port="2" to-layer="1542" to-port="0" /> <edge from-layer="1542" from-port="2" to-layer="1543" to-port="1" /> <edge from-layer="1543" from-port="2" to-layer="1544" to-port="1" /> <edge from-layer="1544" from-port="2" to-layer="1564" to-port="1" /> <edge from-layer="1544" from-port="2" to-layer="4306" to-port="0" /> <edge from-layer="1545" from-port="0" to-layer="1546" to-port="0" /> <edge from-layer="1546" from-port="1" to-layer="1551" to-port="0" /> <edge from-layer="1547" from-port="0" to-layer="1550" to-port="1" /> <edge from-layer="1548" from-port="0" to-layer="1550" to-port="2" /> <edge from-layer="1549" from-port="0" to-layer="1550" to-port="3" /> <edge from-layer="1550" from-port="4" to-layer="1551" to-port="1" /> <edge from-layer="1551" from-port="2" to-layer="1552" to-port="0" /> <edge from-layer="1552" from-port="1" to-layer="1554" to-port="0" /> <edge from-layer="1553" from-port="0" to-layer="1554" to-port="2" /> <edge from-layer="1554" from-port="3" to-layer="1563" to-port="0" /> <edge from-layer="1555" from-port="0" to-layer="1558" to-port="1" /> <edge from-layer="1556" from-port="0" to-layer="1558" to-port="2" /> <edge from-layer="1557" from-port="0" to-layer="1558" to-port="3" /> <edge from-layer="1558" from-port="5" to-layer="1560" to-port="0" /> <edge from-layer="1559" from-port="0" to-layer="1560" to-port="1" /> <edge from-layer="1560" from-port="2" to-layer="1562" to-port="0" /> <edge from-layer="1561" from-port="0" to-layer="1562" to-port="1" /> <edge from-layer="1562" from-port="2" to-layer="1563" to-port="1" /> <edge from-layer="1563" from-port="2" to-layer="1564" to-port="2" /> <edge from-layer="1563" from-port="2" to-layer="4305" to-port="0" /> <edge from-layer="1564" from-port="4" to-layer="1566" to-port="0" /> <edge from-layer="1565" from-port="0" to-layer="1566" to-port="1" /> <edge from-layer="1566" from-port="2" to-layer="1568" to-port="0" /> <edge from-layer="1567" from-port="0" to-layer="1568" to-port="1" /> <edge from-layer="1568" from-port="2" to-layer="1571" to-port="0" /> <edge from-layer="1569" from-port="0" to-layer="1570" to-port="0" /> <edge from-layer="1570" from-port="1" to-layer="1571" to-port="1" /> <edge from-layer="1571" from-port="2" to-layer="1572" to-port="1" /> <edge from-layer="1572" from-port="2" to-layer="1598" to-port="0" /> <edge from-layer="1572" from-port="2" to-layer="1579" to-port="0" /> <edge from-layer="1572" from-port="2" to-layer="1587" to-port="0" /> <edge from-layer="1573" from-port="0" to-layer="1574" to-port="0" /> <edge from-layer="1574" from-port="1" to-layer="1588" to-port="0" /> <edge from-layer="1575" from-port="0" to-layer="1576" to-port="0" /> <edge from-layer="1576" from-port="1" to-layer="1586" to-port="0" /> <edge from-layer="1577" from-port="0" to-layer="1578" to-port="0" /> <edge from-layer="1578" from-port="1" to-layer="1579" to-port="1" /> <edge from-layer="1579" from-port="2" to-layer="1581" to-port="0" /> <edge from-layer="1580" from-port="0" to-layer="1581" to-port="1" /> <edge from-layer="1581" from-port="2" to-layer="1584" to-port="0" /> <edge from-layer="1582" from-port="0" to-layer="1583" to-port="0" /> <edge from-layer="1583" from-port="1" to-layer="1584" to-port="1" /> <edge from-layer="1584" from-port="2" to-layer="1585" to-port="0" /> <edge from-layer="1585" from-port="1" to-layer="1586" to-port="1" /> <edge from-layer="1586" from-port="2" to-layer="1587" to-port="1" /> <edge from-layer="1587" from-port="2" to-layer="1588" to-port="1" /> <edge from-layer="1588" from-port="2" to-layer="1591" to-port="0" /> <edge from-layer="1589" from-port="0" to-layer="1590" to-port="0" /> <edge from-layer="1590" from-port="1" to-layer="1591" to-port="1" /> <edge from-layer="1591" from-port="2" to-layer="1592" to-port="0" /> <edge from-layer="1592" from-port="4" to-layer="1594" to-port="0" /> <edge from-layer="1592" from-port="3" to-layer="1593" to-port="0" /> <edge from-layer="1593" from-port="1" to-layer="1594" to-port="1" /> <edge from-layer="1594" from-port="2" to-layer="1597" to-port="0" /> <edge from-layer="1595" from-port="0" to-layer="1596" to-port="0" /> <edge from-layer="1596" from-port="1" to-layer="1597" to-port="1" /> <edge from-layer="1597" from-port="2" to-layer="1598" to-port="1" /> <edge from-layer="1598" from-port="2" to-layer="1702" to-port="0" /> <edge from-layer="1598" from-port="2" to-layer="1605" to-port="0" /> <edge from-layer="1598" from-port="2" to-layer="1613" to-port="0" /> <edge from-layer="1599" from-port="0" to-layer="1600" to-port="0" /> <edge from-layer="1600" from-port="1" to-layer="1614" to-port="0" /> <edge from-layer="1601" from-port="0" to-layer="1602" to-port="0" /> <edge from-layer="1602" from-port="1" to-layer="1612" to-port="0" /> <edge from-layer="1603" from-port="0" to-layer="1604" to-port="0" /> <edge from-layer="1604" from-port="1" to-layer="1605" to-port="1" /> <edge from-layer="1605" from-port="2" to-layer="1607" to-port="0" /> <edge from-layer="1606" from-port="0" to-layer="1607" to-port="1" /> <edge from-layer="1607" from-port="2" to-layer="1610" to-port="0" /> <edge from-layer="1608" from-port="0" to-layer="1609" to-port="0" /> <edge from-layer="1609" from-port="1" to-layer="1610" to-port="1" /> <edge from-layer="1610" from-port="2" to-layer="1611" to-port="0" /> <edge from-layer="1611" from-port="1" to-layer="1612" to-port="1" /> <edge from-layer="1612" from-port="2" to-layer="1613" to-port="1" /> <edge from-layer="1613" from-port="2" to-layer="1614" to-port="1" /> <edge from-layer="1614" from-port="2" to-layer="1617" to-port="0" /> <edge from-layer="1615" from-port="0" to-layer="1616" to-port="0" /> <edge from-layer="1616" from-port="1" to-layer="1617" to-port="1" /> <edge from-layer="1617" from-port="2" to-layer="1688" to-port="0" /> <edge from-layer="1617" from-port="2" to-layer="1654" to-port="0" /> <edge from-layer="1617" from-port="2" to-layer="1621" to-port="0" /> <edge from-layer="1618" from-port="0" to-layer="1621" to-port="1" /> <edge from-layer="1619" from-port="0" to-layer="1621" to-port="2" /> <edge from-layer="1620" from-port="0" to-layer="1621" to-port="3" /> <edge from-layer="1621" from-port="5" to-layer="1623" to-port="0" /> <edge from-layer="1622" from-port="0" to-layer="1623" to-port="1" /> <edge from-layer="1623" from-port="2" to-layer="1625" to-port="0" /> <edge from-layer="1624" from-port="0" to-layer="1625" to-port="1" /> <edge from-layer="1625" from-port="2" to-layer="1626" to-port="0" /> <edge from-layer="1625" from-port="2" to-layer="1630" to-port="0" /> <edge from-layer="1625" from-port="2" to-layer="1637" to-port="0" /> <edge from-layer="1626" from-port="2" to-layer="1640" to-port="0" /> <edge from-layer="1627" from-port="0" to-layer="1630" to-port="1" /> <edge from-layer="1628" from-port="0" to-layer="1630" to-port="2" /> <edge from-layer="1629" from-port="0" to-layer="1630" to-port="3" /> <edge from-layer="1630" from-port="5" to-layer="1633" to-port="0" /> <edge from-layer="1631" from-port="0" to-layer="1632" to-port="0" /> <edge from-layer="1632" from-port="1" to-layer="1633" to-port="1" /> <edge from-layer="1633" from-port="2" to-layer="1638" to-port="0" /> <edge from-layer="1634" from-port="0" to-layer="1637" to-port="1" /> <edge from-layer="1635" from-port="0" to-layer="1637" to-port="2" /> <edge from-layer="1636" from-port="0" to-layer="1637" to-port="3" /> <edge from-layer="1637" from-port="5" to-layer="1638" to-port="1" /> <edge from-layer="1638" from-port="2" to-layer="1639" to-port="0" /> <edge from-layer="1639" from-port="2" to-layer="1640" to-port="1" /> <edge from-layer="1640" from-port="2" to-layer="1694" to-port="0" /> <edge from-layer="1641" from-port="0" to-layer="1642" to-port="0" /> <edge from-layer="1642" from-port="1" to-layer="1647" to-port="0" /> <edge from-layer="1643" from-port="0" to-layer="1646" to-port="1" /> <edge from-layer="1644" from-port="0" to-layer="1646" to-port="2" /> <edge from-layer="1645" from-port="0" to-layer="1646" to-port="3" /> <edge from-layer="1646" from-port="4" to-layer="1647" to-port="1" /> <edge from-layer="1647" from-port="2" to-layer="1648" to-port="0" /> <edge from-layer="1648" from-port="1" to-layer="1650" to-port="0" /> <edge from-layer="1649" from-port="0" to-layer="1650" to-port="2" /> <edge from-layer="1650" from-port="3" to-layer="1674" to-port="0" /> <edge from-layer="1651" from-port="0" to-layer="1654" to-port="1" /> <edge from-layer="1652" from-port="0" to-layer="1654" to-port="2" /> <edge from-layer="1653" from-port="0" to-layer="1654" to-port="3" /> <edge from-layer="1654" from-port="5" to-layer="1656" to-port="0" /> <edge from-layer="1655" from-port="0" to-layer="1656" to-port="1" /> <edge from-layer="1656" from-port="2" to-layer="1658" to-port="0" /> <edge from-layer="1657" from-port="0" to-layer="1658" to-port="1" /> <edge from-layer="1658" from-port="2" to-layer="1659" to-port="0" /> <edge from-layer="1658" from-port="2" to-layer="1663" to-port="0" /> <edge from-layer="1658" from-port="2" to-layer="1670" to-port="0" /> <edge from-layer="1659" from-port="2" to-layer="1673" to-port="0" /> <edge from-layer="1660" from-port="0" to-layer="1663" to-port="1" /> <edge from-layer="1661" from-port="0" to-layer="1663" to-port="2" /> <edge from-layer="1662" from-port="0" to-layer="1663" to-port="3" /> <edge from-layer="1663" from-port="5" to-layer="1666" to-port="0" /> <edge from-layer="1664" from-port="0" to-layer="1665" to-port="0" /> <edge from-layer="1665" from-port="1" to-layer="1666" to-port="1" /> <edge from-layer="1666" from-port="2" to-layer="1671" to-port="0" /> <edge from-layer="1667" from-port="0" to-layer="1670" to-port="1" /> <edge from-layer="1668" from-port="0" to-layer="1670" to-port="2" /> <edge from-layer="1669" from-port="0" to-layer="1670" to-port="3" /> <edge from-layer="1670" from-port="5" to-layer="1671" to-port="1" /> <edge from-layer="1671" from-port="2" to-layer="1672" to-port="0" /> <edge from-layer="1672" from-port="2" to-layer="1673" to-port="1" /> <edge from-layer="1673" from-port="2" to-layer="1674" to-port="1" /> <edge from-layer="1674" from-port="2" to-layer="1694" to-port="1" /> <edge from-layer="1674" from-port="2" to-layer="4304" to-port="0" /> <edge from-layer="1675" from-port="0" to-layer="1676" to-port="0" /> <edge from-layer="1676" from-port="1" to-layer="1681" to-port="0" /> <edge from-layer="1677" from-port="0" to-layer="1680" to-port="1" /> <edge from-layer="1678" from-port="0" to-layer="1680" to-port="2" /> <edge from-layer="1679" from-port="0" to-layer="1680" to-port="3" /> <edge from-layer="1680" from-port="4" to-layer="1681" to-port="1" /> <edge from-layer="1681" from-port="2" to-layer="1682" to-port="0" /> <edge from-layer="1682" from-port="1" to-layer="1684" to-port="0" /> <edge from-layer="1683" from-port="0" to-layer="1684" to-port="2" /> <edge from-layer="1684" from-port="3" to-layer="1693" to-port="0" /> <edge from-layer="1685" from-port="0" to-layer="1688" to-port="1" /> <edge from-layer="1686" from-port="0" to-layer="1688" to-port="2" /> <edge from-layer="1687" from-port="0" to-layer="1688" to-port="3" /> <edge from-layer="1688" from-port="5" to-layer="1690" to-port="0" /> <edge from-layer="1689" from-port="0" to-layer="1690" to-port="1" /> <edge from-layer="1690" from-port="2" to-layer="1692" to-port="0" /> <edge from-layer="1691" from-port="0" to-layer="1692" to-port="1" /> <edge from-layer="1692" from-port="2" to-layer="1693" to-port="1" /> <edge from-layer="1693" from-port="2" to-layer="1694" to-port="2" /> <edge from-layer="1693" from-port="2" to-layer="4303" to-port="0" /> <edge from-layer="1694" from-port="4" to-layer="1696" to-port="0" /> <edge from-layer="1695" from-port="0" to-layer="1696" to-port="1" /> <edge from-layer="1696" from-port="2" to-layer="1698" to-port="0" /> <edge from-layer="1697" from-port="0" to-layer="1698" to-port="1" /> <edge from-layer="1698" from-port="2" to-layer="1701" to-port="0" /> <edge from-layer="1699" from-port="0" to-layer="1700" to-port="0" /> <edge from-layer="1700" from-port="1" to-layer="1701" to-port="1" /> <edge from-layer="1701" from-port="2" to-layer="1702" to-port="1" /> <edge from-layer="1702" from-port="2" to-layer="1709" to-port="0" /> <edge from-layer="1702" from-port="2" to-layer="1728" to-port="0" /> <edge from-layer="1702" from-port="2" to-layer="1717" to-port="0" /> <edge from-layer="1703" from-port="0" to-layer="1704" to-port="0" /> <edge from-layer="1704" from-port="1" to-layer="1718" to-port="0" /> <edge from-layer="1705" from-port="0" to-layer="1706" to-port="0" /> <edge from-layer="1706" from-port="1" to-layer="1716" to-port="0" /> <edge from-layer="1707" from-port="0" to-layer="1708" to-port="0" /> <edge from-layer="1708" from-port="1" to-layer="1709" to-port="1" /> <edge from-layer="1709" from-port="2" to-layer="1711" to-port="0" /> <edge from-layer="1710" from-port="0" to-layer="1711" to-port="1" /> <edge from-layer="1711" from-port="2" to-layer="1714" to-port="0" /> <edge from-layer="1712" from-port="0" to-layer="1713" to-port="0" /> <edge from-layer="1713" from-port="1" to-layer="1714" to-port="1" /> <edge from-layer="1714" from-port="2" to-layer="1715" to-port="0" /> <edge from-layer="1715" from-port="1" to-layer="1716" to-port="1" /> <edge from-layer="1716" from-port="2" to-layer="1717" to-port="1" /> <edge from-layer="1717" from-port="2" to-layer="1718" to-port="1" /> <edge from-layer="1718" from-port="2" to-layer="1721" to-port="0" /> <edge from-layer="1719" from-port="0" to-layer="1720" to-port="0" /> <edge from-layer="1720" from-port="1" to-layer="1721" to-port="1" /> <edge from-layer="1721" from-port="2" to-layer="1722" to-port="0" /> <edge from-layer="1722" from-port="3" to-layer="1723" to-port="0" /> <edge from-layer="1722" from-port="4" to-layer="1724" to-port="0" /> <edge from-layer="1723" from-port="1" to-layer="1724" to-port="1" /> <edge from-layer="1724" from-port="2" to-layer="1727" to-port="0" /> <edge from-layer="1725" from-port="0" to-layer="1726" to-port="0" /> <edge from-layer="1726" from-port="1" to-layer="1727" to-port="1" /> <edge from-layer="1727" from-port="2" to-layer="1728" to-port="1" /> <edge from-layer="1728" from-port="2" to-layer="1832" to-port="0" /> <edge from-layer="1728" from-port="2" to-layer="1735" to-port="0" /> <edge from-layer="1728" from-port="2" to-layer="1743" to-port="0" /> <edge from-layer="1729" from-port="0" to-layer="1730" to-port="0" /> <edge from-layer="1730" from-port="1" to-layer="1744" to-port="0" /> <edge from-layer="1731" from-port="0" to-layer="1732" to-port="0" /> <edge from-layer="1732" from-port="1" to-layer="1742" to-port="0" /> <edge from-layer="1733" from-port="0" to-layer="1734" to-port="0" /> <edge from-layer="1734" from-port="1" to-layer="1735" to-port="1" /> <edge from-layer="1735" from-port="2" to-layer="1737" to-port="0" /> <edge from-layer="1736" from-port="0" to-layer="1737" to-port="1" /> <edge from-layer="1737" from-port="2" to-layer="1740" to-port="0" /> <edge from-layer="1738" from-port="0" to-layer="1739" to-port="0" /> <edge from-layer="1739" from-port="1" to-layer="1740" to-port="1" /> <edge from-layer="1740" from-port="2" to-layer="1741" to-port="0" /> <edge from-layer="1741" from-port="1" to-layer="1742" to-port="1" /> <edge from-layer="1742" from-port="2" to-layer="1743" to-port="1" /> <edge from-layer="1743" from-port="2" to-layer="1744" to-port="1" /> <edge from-layer="1744" from-port="2" to-layer="1747" to-port="0" /> <edge from-layer="1745" from-port="0" to-layer="1746" to-port="0" /> <edge from-layer="1746" from-port="1" to-layer="1747" to-port="1" /> <edge from-layer="1747" from-port="2" to-layer="1818" to-port="0" /> <edge from-layer="1747" from-port="2" to-layer="1784" to-port="0" /> <edge from-layer="1747" from-port="2" to-layer="1751" to-port="0" /> <edge from-layer="1748" from-port="0" to-layer="1751" to-port="1" /> <edge from-layer="1749" from-port="0" to-layer="1751" to-port="2" /> <edge from-layer="1750" from-port="0" to-layer="1751" to-port="3" /> <edge from-layer="1751" from-port="5" to-layer="1753" to-port="0" /> <edge from-layer="1752" from-port="0" to-layer="1753" to-port="1" /> <edge from-layer="1753" from-port="2" to-layer="1755" to-port="0" /> <edge from-layer="1754" from-port="0" to-layer="1755" to-port="1" /> <edge from-layer="1755" from-port="2" to-layer="1756" to-port="0" /> <edge from-layer="1755" from-port="2" to-layer="1760" to-port="0" /> <edge from-layer="1755" from-port="2" to-layer="1767" to-port="0" /> <edge from-layer="1756" from-port="2" to-layer="1770" to-port="0" /> <edge from-layer="1757" from-port="0" to-layer="1760" to-port="1" /> <edge from-layer="1758" from-port="0" to-layer="1760" to-port="2" /> <edge from-layer="1759" from-port="0" to-layer="1760" to-port="3" /> <edge from-layer="1760" from-port="5" to-layer="1763" to-port="0" /> <edge from-layer="1761" from-port="0" to-layer="1762" to-port="0" /> <edge from-layer="1762" from-port="1" to-layer="1763" to-port="1" /> <edge from-layer="1763" from-port="2" to-layer="1768" to-port="0" /> <edge from-layer="1764" from-port="0" to-layer="1767" to-port="1" /> <edge from-layer="1765" from-port="0" to-layer="1767" to-port="2" /> <edge from-layer="1766" from-port="0" to-layer="1767" to-port="3" /> <edge from-layer="1767" from-port="5" to-layer="1768" to-port="1" /> <edge from-layer="1768" from-port="2" to-layer="1769" to-port="0" /> <edge from-layer="1769" from-port="2" to-layer="1770" to-port="1" /> <edge from-layer="1770" from-port="2" to-layer="1824" to-port="0" /> <edge from-layer="1771" from-port="0" to-layer="1772" to-port="0" /> <edge from-layer="1772" from-port="1" to-layer="1777" to-port="0" /> <edge from-layer="1773" from-port="0" to-layer="1776" to-port="1" /> <edge from-layer="1774" from-port="0" to-layer="1776" to-port="2" /> <edge from-layer="1775" from-port="0" to-layer="1776" to-port="3" /> <edge from-layer="1776" from-port="4" to-layer="1777" to-port="1" /> <edge from-layer="1777" from-port="2" to-layer="1778" to-port="0" /> <edge from-layer="1778" from-port="1" to-layer="1780" to-port="0" /> <edge from-layer="1779" from-port="0" to-layer="1780" to-port="2" /> <edge from-layer="1780" from-port="3" to-layer="1804" to-port="0" /> <edge from-layer="1781" from-port="0" to-layer="1784" to-port="1" /> <edge from-layer="1782" from-port="0" to-layer="1784" to-port="2" /> <edge from-layer="1783" from-port="0" to-layer="1784" to-port="3" /> <edge from-layer="1784" from-port="5" to-layer="1786" to-port="0" /> <edge from-layer="1785" from-port="0" to-layer="1786" to-port="1" /> <edge from-layer="1786" from-port="2" to-layer="1788" to-port="0" /> <edge from-layer="1787" from-port="0" to-layer="1788" to-port="1" /> <edge from-layer="1788" from-port="2" to-layer="1789" to-port="0" /> <edge from-layer="1788" from-port="2" to-layer="1793" to-port="0" /> <edge from-layer="1788" from-port="2" to-layer="1800" to-port="0" /> <edge from-layer="1789" from-port="2" to-layer="1803" to-port="0" /> <edge from-layer="1790" from-port="0" to-layer="1793" to-port="1" /> <edge from-layer="1791" from-port="0" to-layer="1793" to-port="2" /> <edge from-layer="1792" from-port="0" to-layer="1793" to-port="3" /> <edge from-layer="1793" from-port="5" to-layer="1796" to-port="0" /> <edge from-layer="1794" from-port="0" to-layer="1795" to-port="0" /> <edge from-layer="1795" from-port="1" to-layer="1796" to-port="1" /> <edge from-layer="1796" from-port="2" to-layer="1801" to-port="0" /> <edge from-layer="1797" from-port="0" to-layer="1800" to-port="1" /> <edge from-layer="1798" from-port="0" to-layer="1800" to-port="2" /> <edge from-layer="1799" from-port="0" to-layer="1800" to-port="3" /> <edge from-layer="1800" from-port="5" to-layer="1801" to-port="1" /> <edge from-layer="1801" from-port="2" to-layer="1802" to-port="0" /> <edge from-layer="1802" from-port="2" to-layer="1803" to-port="1" /> <edge from-layer="1803" from-port="2" to-layer="1804" to-port="1" /> <edge from-layer="1804" from-port="2" to-layer="4302" to-port="0" /> <edge from-layer="1804" from-port="2" to-layer="1824" to-port="1" /> <edge from-layer="1805" from-port="0" to-layer="1806" to-port="0" /> <edge from-layer="1806" from-port="1" to-layer="1811" to-port="0" /> <edge from-layer="1807" from-port="0" to-layer="1810" to-port="1" /> <edge from-layer="1808" from-port="0" to-layer="1810" to-port="2" /> <edge from-layer="1809" from-port="0" to-layer="1810" to-port="3" /> <edge from-layer="1810" from-port="4" to-layer="1811" to-port="1" /> <edge from-layer="1811" from-port="2" to-layer="1812" to-port="0" /> <edge from-layer="1812" from-port="1" to-layer="1814" to-port="0" /> <edge from-layer="1813" from-port="0" to-layer="1814" to-port="2" /> <edge from-layer="1814" from-port="3" to-layer="1823" to-port="0" /> <edge from-layer="1815" from-port="0" to-layer="1818" to-port="1" /> <edge from-layer="1816" from-port="0" to-layer="1818" to-port="2" /> <edge from-layer="1817" from-port="0" to-layer="1818" to-port="3" /> <edge from-layer="1818" from-port="5" to-layer="1820" to-port="0" /> <edge from-layer="1819" from-port="0" to-layer="1820" to-port="1" /> <edge from-layer="1820" from-port="2" to-layer="1822" to-port="0" /> <edge from-layer="1821" from-port="0" to-layer="1822" to-port="1" /> <edge from-layer="1822" from-port="2" to-layer="1823" to-port="1" /> <edge from-layer="1823" from-port="2" to-layer="4301" to-port="0" /> <edge from-layer="1823" from-port="2" to-layer="1824" to-port="2" /> <edge from-layer="1824" from-port="4" to-layer="1826" to-port="0" /> <edge from-layer="1825" from-port="0" to-layer="1826" to-port="1" /> <edge from-layer="1826" from-port="2" to-layer="1828" to-port="0" /> <edge from-layer="1827" from-port="0" to-layer="1828" to-port="1" /> <edge from-layer="1828" from-port="2" to-layer="1831" to-port="0" /> <edge from-layer="1829" from-port="0" to-layer="1830" to-port="0" /> <edge from-layer="1830" from-port="1" to-layer="1831" to-port="1" /> <edge from-layer="1831" from-port="2" to-layer="1832" to-port="1" /> <edge from-layer="1832" from-port="2" to-layer="1847" to-port="0" /> <edge from-layer="1832" from-port="2" to-layer="1858" to-port="0" /> <edge from-layer="1832" from-port="2" to-layer="1839" to-port="0" /> <edge from-layer="1833" from-port="0" to-layer="1834" to-port="0" /> <edge from-layer="1834" from-port="1" to-layer="1848" to-port="0" /> <edge from-layer="1835" from-port="0" to-layer="1836" to-port="0" /> <edge from-layer="1836" from-port="1" to-layer="1846" to-port="0" /> <edge from-layer="1837" from-port="0" to-layer="1838" to-port="0" /> <edge from-layer="1838" from-port="1" to-layer="1839" to-port="1" /> <edge from-layer="1839" from-port="2" to-layer="1841" to-port="0" /> <edge from-layer="1840" from-port="0" to-layer="1841" to-port="1" /> <edge from-layer="1841" from-port="2" to-layer="1844" to-port="0" /> <edge from-layer="1842" from-port="0" to-layer="1843" to-port="0" /> <edge from-layer="1843" from-port="1" to-layer="1844" to-port="1" /> <edge from-layer="1844" from-port="2" to-layer="1845" to-port="0" /> <edge from-layer="1845" from-port="1" to-layer="1846" to-port="1" /> <edge from-layer="1846" from-port="2" to-layer="1847" to-port="1" /> <edge from-layer="1847" from-port="2" to-layer="1848" to-port="1" /> <edge from-layer="1848" from-port="2" to-layer="1851" to-port="0" /> <edge from-layer="1849" from-port="0" to-layer="1850" to-port="0" /> <edge from-layer="1850" from-port="1" to-layer="1851" to-port="1" /> <edge from-layer="1851" from-port="2" to-layer="1852" to-port="0" /> <edge from-layer="1852" from-port="3" to-layer="1853" to-port="0" /> <edge from-layer="1852" from-port="4" to-layer="1854" to-port="0" /> <edge from-layer="1853" from-port="1" to-layer="1854" to-port="1" /> <edge from-layer="1854" from-port="2" to-layer="1857" to-port="0" /> <edge from-layer="1855" from-port="0" to-layer="1856" to-port="0" /> <edge from-layer="1856" from-port="1" to-layer="1857" to-port="1" /> <edge from-layer="1857" from-port="2" to-layer="1858" to-port="1" /> <edge from-layer="1858" from-port="2" to-layer="1873" to-port="0" /> <edge from-layer="1858" from-port="2" to-layer="1865" to-port="0" /> <edge from-layer="1858" from-port="2" to-layer="1962" to-port="0" /> <edge from-layer="1859" from-port="0" to-layer="1860" to-port="0" /> <edge from-layer="1860" from-port="1" to-layer="1874" to-port="0" /> <edge from-layer="1861" from-port="0" to-layer="1862" to-port="0" /> <edge from-layer="1862" from-port="1" to-layer="1872" to-port="0" /> <edge from-layer="1863" from-port="0" to-layer="1864" to-port="0" /> <edge from-layer="1864" from-port="1" to-layer="1865" to-port="1" /> <edge from-layer="1865" from-port="2" to-layer="1867" to-port="0" /> <edge from-layer="1866" from-port="0" to-layer="1867" to-port="1" /> <edge from-layer="1867" from-port="2" to-layer="1870" to-port="0" /> <edge from-layer="1868" from-port="0" to-layer="1869" to-port="0" /> <edge from-layer="1869" from-port="1" to-layer="1870" to-port="1" /> <edge from-layer="1870" from-port="2" to-layer="1871" to-port="0" /> <edge from-layer="1871" from-port="1" to-layer="1872" to-port="1" /> <edge from-layer="1872" from-port="2" to-layer="1873" to-port="1" /> <edge from-layer="1873" from-port="2" to-layer="1874" to-port="1" /> <edge from-layer="1874" from-port="2" to-layer="1877" to-port="0" /> <edge from-layer="1875" from-port="0" to-layer="1876" to-port="0" /> <edge from-layer="1876" from-port="1" to-layer="1877" to-port="1" /> <edge from-layer="1877" from-port="2" to-layer="1881" to-port="0" /> <edge from-layer="1877" from-port="2" to-layer="1948" to-port="0" /> <edge from-layer="1877" from-port="2" to-layer="1914" to-port="0" /> <edge from-layer="1878" from-port="0" to-layer="1881" to-port="1" /> <edge from-layer="1879" from-port="0" to-layer="1881" to-port="2" /> <edge from-layer="1880" from-port="0" to-layer="1881" to-port="3" /> <edge from-layer="1881" from-port="5" to-layer="1883" to-port="0" /> <edge from-layer="1882" from-port="0" to-layer="1883" to-port="1" /> <edge from-layer="1883" from-port="2" to-layer="1885" to-port="0" /> <edge from-layer="1884" from-port="0" to-layer="1885" to-port="1" /> <edge from-layer="1885" from-port="2" to-layer="1897" to-port="0" /> <edge from-layer="1885" from-port="2" to-layer="1890" to-port="0" /> <edge from-layer="1885" from-port="2" to-layer="1886" to-port="0" /> <edge from-layer="1886" from-port="2" to-layer="1900" to-port="0" /> <edge from-layer="1887" from-port="0" to-layer="1890" to-port="1" /> <edge from-layer="1888" from-port="0" to-layer="1890" to-port="2" /> <edge from-layer="1889" from-port="0" to-layer="1890" to-port="3" /> <edge from-layer="1890" from-port="5" to-layer="1893" to-port="0" /> <edge from-layer="1891" from-port="0" to-layer="1892" to-port="0" /> <edge from-layer="1892" from-port="1" to-layer="1893" to-port="1" /> <edge from-layer="1893" from-port="2" to-layer="1898" to-port="0" /> <edge from-layer="1894" from-port="0" to-layer="1897" to-port="1" /> <edge from-layer="1895" from-port="0" to-layer="1897" to-port="2" /> <edge from-layer="1896" from-port="0" to-layer="1897" to-port="3" /> <edge from-layer="1897" from-port="5" to-layer="1898" to-port="1" /> <edge from-layer="1898" from-port="2" to-layer="1899" to-port="0" /> <edge from-layer="1899" from-port="2" to-layer="1900" to-port="1" /> <edge from-layer="1900" from-port="2" to-layer="1954" to-port="0" /> <edge from-layer="1901" from-port="0" to-layer="1902" to-port="0" /> <edge from-layer="1902" from-port="1" to-layer="1907" to-port="0" /> <edge from-layer="1903" from-port="0" to-layer="1906" to-port="1" /> <edge from-layer="1904" from-port="0" to-layer="1906" to-port="2" /> <edge from-layer="1905" from-port="0" to-layer="1906" to-port="3" /> <edge from-layer="1906" from-port="4" to-layer="1907" to-port="1" /> <edge from-layer="1907" from-port="2" to-layer="1908" to-port="0" /> <edge from-layer="1908" from-port="1" to-layer="1910" to-port="0" /> <edge from-layer="1909" from-port="0" to-layer="1910" to-port="2" /> <edge from-layer="1910" from-port="3" to-layer="1934" to-port="0" /> <edge from-layer="1911" from-port="0" to-layer="1914" to-port="1" /> <edge from-layer="1912" from-port="0" to-layer="1914" to-port="2" /> <edge from-layer="1913" from-port="0" to-layer="1914" to-port="3" /> <edge from-layer="1914" from-port="5" to-layer="1916" to-port="0" /> <edge from-layer="1915" from-port="0" to-layer="1916" to-port="1" /> <edge from-layer="1916" from-port="2" to-layer="1918" to-port="0" /> <edge from-layer="1917" from-port="0" to-layer="1918" to-port="1" /> <edge from-layer="1918" from-port="2" to-layer="1930" to-port="0" /> <edge from-layer="1918" from-port="2" to-layer="1923" to-port="0" /> <edge from-layer="1918" from-port="2" to-layer="1919" to-port="0" /> <edge from-layer="1919" from-port="2" to-layer="1933" to-port="0" /> <edge from-layer="1920" from-port="0" to-layer="1923" to-port="1" /> <edge from-layer="1921" from-port="0" to-layer="1923" to-port="2" /> <edge from-layer="1922" from-port="0" to-layer="1923" to-port="3" /> <edge from-layer="1923" from-port="5" to-layer="1926" to-port="0" /> <edge from-layer="1924" from-port="0" to-layer="1925" to-port="0" /> <edge from-layer="1925" from-port="1" to-layer="1926" to-port="1" /> <edge from-layer="1926" from-port="2" to-layer="1931" to-port="0" /> <edge from-layer="1927" from-port="0" to-layer="1930" to-port="1" /> <edge from-layer="1928" from-port="0" to-layer="1930" to-port="2" /> <edge from-layer="1929" from-port="0" to-layer="1930" to-port="3" /> <edge from-layer="1930" from-port="5" to-layer="1931" to-port="1" /> <edge from-layer="1931" from-port="2" to-layer="1932" to-port="0" /> <edge from-layer="1932" from-port="2" to-layer="1933" to-port="1" /> <edge from-layer="1933" from-port="2" to-layer="1934" to-port="1" /> <edge from-layer="1934" from-port="2" to-layer="1954" to-port="1" /> <edge from-layer="1934" from-port="2" to-layer="4300" to-port="0" /> <edge from-layer="1935" from-port="0" to-layer="1936" to-port="0" /> <edge from-layer="1936" from-port="1" to-layer="1941" to-port="0" /> <edge from-layer="1937" from-port="0" to-layer="1940" to-port="1" /> <edge from-layer="1938" from-port="0" to-layer="1940" to-port="2" /> <edge from-layer="1939" from-port="0" to-layer="1940" to-port="3" /> <edge from-layer="1940" from-port="4" to-layer="1941" to-port="1" /> <edge from-layer="1941" from-port="2" to-layer="1942" to-port="0" /> <edge from-layer="1942" from-port="1" to-layer="1944" to-port="0" /> <edge from-layer="1943" from-port="0" to-layer="1944" to-port="2" /> <edge from-layer="1944" from-port="3" to-layer="1953" to-port="0" /> <edge from-layer="1945" from-port="0" to-layer="1948" to-port="1" /> <edge from-layer="1946" from-port="0" to-layer="1948" to-port="2" /> <edge from-layer="1947" from-port="0" to-layer="1948" to-port="3" /> <edge from-layer="1948" from-port="5" to-layer="1950" to-port="0" /> <edge from-layer="1949" from-port="0" to-layer="1950" to-port="1" /> <edge from-layer="1950" from-port="2" to-layer="1952" to-port="0" /> <edge from-layer="1951" from-port="0" to-layer="1952" to-port="1" /> <edge from-layer="1952" from-port="2" to-layer="1953" to-port="1" /> <edge from-layer="1953" from-port="2" to-layer="4299" to-port="0" /> <edge from-layer="1953" from-port="2" to-layer="1954" to-port="2" /> <edge from-layer="1954" from-port="4" to-layer="1956" to-port="0" /> <edge from-layer="1955" from-port="0" to-layer="1956" to-port="1" /> <edge from-layer="1956" from-port="2" to-layer="1958" to-port="0" /> <edge from-layer="1957" from-port="0" to-layer="1958" to-port="1" /> <edge from-layer="1958" from-port="2" to-layer="1961" to-port="0" /> <edge from-layer="1959" from-port="0" to-layer="1960" to-port="0" /> <edge from-layer="1960" from-port="1" to-layer="1961" to-port="1" /> <edge from-layer="1961" from-port="2" to-layer="1962" to-port="1" /> <edge from-layer="1962" from-port="2" to-layer="1988" to-port="0" /> <edge from-layer="1962" from-port="2" to-layer="1977" to-port="0" /> <edge from-layer="1962" from-port="2" to-layer="1969" to-port="0" /> <edge from-layer="1963" from-port="0" to-layer="1964" to-port="0" /> <edge from-layer="1964" from-port="1" to-layer="1978" to-port="0" /> <edge from-layer="1965" from-port="0" to-layer="1966" to-port="0" /> <edge from-layer="1966" from-port="1" to-layer="1976" to-port="0" /> <edge from-layer="1967" from-port="0" to-layer="1968" to-port="0" /> <edge from-layer="1968" from-port="1" to-layer="1969" to-port="1" /> <edge from-layer="1969" from-port="2" to-layer="1971" to-port="0" /> <edge from-layer="1970" from-port="0" to-layer="1971" to-port="1" /> <edge from-layer="1971" from-port="2" to-layer="1974" to-port="0" /> <edge from-layer="1972" from-port="0" to-layer="1973" to-port="0" /> <edge from-layer="1973" from-port="1" to-layer="1974" to-port="1" /> <edge from-layer="1974" from-port="2" to-layer="1975" to-port="0" /> <edge from-layer="1975" from-port="1" to-layer="1976" to-port="1" /> <edge from-layer="1976" from-port="2" to-layer="1977" to-port="1" /> <edge from-layer="1977" from-port="2" to-layer="1978" to-port="1" /> <edge from-layer="1978" from-port="2" to-layer="1981" to-port="0" /> <edge from-layer="1979" from-port="0" to-layer="1980" to-port="0" /> <edge from-layer="1980" from-port="1" to-layer="1981" to-port="1" /> <edge from-layer="1981" from-port="2" to-layer="1982" to-port="0" /> <edge from-layer="1982" from-port="3" to-layer="1983" to-port="0" /> <edge from-layer="1982" from-port="4" to-layer="1984" to-port="0" /> <edge from-layer="1983" from-port="1" to-layer="1984" to-port="1" /> <edge from-layer="1984" from-port="2" to-layer="1987" to-port="0" /> <edge from-layer="1985" from-port="0" to-layer="1986" to-port="0" /> <edge from-layer="1986" from-port="1" to-layer="1987" to-port="1" /> <edge from-layer="1987" from-port="2" to-layer="1988" to-port="1" /> <edge from-layer="1988" from-port="2" to-layer="2003" to-port="0" /> <edge from-layer="1988" from-port="2" to-layer="1995" to-port="0" /> <edge from-layer="1988" from-port="2" to-layer="2092" to-port="0" /> <edge from-layer="1989" from-port="0" to-layer="1990" to-port="0" /> <edge from-layer="1990" from-port="1" to-layer="2004" to-port="0" /> <edge from-layer="1991" from-port="0" to-layer="1992" to-port="0" /> <edge from-layer="1992" from-port="1" to-layer="2002" to-port="0" /> <edge from-layer="1993" from-port="0" to-layer="1994" to-port="0" /> <edge from-layer="1994" from-port="1" to-layer="1995" to-port="1" /> <edge from-layer="1995" from-port="2" to-layer="1997" to-port="0" /> <edge from-layer="1996" from-port="0" to-layer="1997" to-port="1" /> <edge from-layer="1997" from-port="2" to-layer="2000" to-port="0" /> <edge from-layer="1998" from-port="0" to-layer="1999" to-port="0" /> <edge from-layer="1999" from-port="1" to-layer="2000" to-port="1" /> <edge from-layer="2000" from-port="2" to-layer="2001" to-port="0" /> <edge from-layer="2001" from-port="1" to-layer="2002" to-port="1" /> <edge from-layer="2002" from-port="2" to-layer="2003" to-port="1" /> <edge from-layer="2003" from-port="2" to-layer="2004" to-port="1" /> <edge from-layer="2004" from-port="2" to-layer="2007" to-port="0" /> <edge from-layer="2005" from-port="0" to-layer="2006" to-port="0" /> <edge from-layer="2006" from-port="1" to-layer="2007" to-port="1" /> <edge from-layer="2007" from-port="2" to-layer="2078" to-port="0" /> <edge from-layer="2007" from-port="2" to-layer="2011" to-port="0" /> <edge from-layer="2007" from-port="2" to-layer="2044" to-port="0" /> <edge from-layer="2008" from-port="0" to-layer="2011" to-port="1" /> <edge from-layer="2009" from-port="0" to-layer="2011" to-port="2" /> <edge from-layer="2010" from-port="0" to-layer="2011" to-port="3" /> <edge from-layer="2011" from-port="5" to-layer="2013" to-port="0" /> <edge from-layer="2012" from-port="0" to-layer="2013" to-port="1" /> <edge from-layer="2013" from-port="2" to-layer="2015" to-port="0" /> <edge from-layer="2014" from-port="0" to-layer="2015" to-port="1" /> <edge from-layer="2015" from-port="2" to-layer="2027" to-port="0" /> <edge from-layer="2015" from-port="2" to-layer="2020" to-port="0" /> <edge from-layer="2015" from-port="2" to-layer="2016" to-port="0" /> <edge from-layer="2016" from-port="2" to-layer="2030" to-port="0" /> <edge from-layer="2017" from-port="0" to-layer="2020" to-port="1" /> <edge from-layer="2018" from-port="0" to-layer="2020" to-port="2" /> <edge from-layer="2019" from-port="0" to-layer="2020" to-port="3" /> <edge from-layer="2020" from-port="5" to-layer="2023" to-port="0" /> <edge from-layer="2021" from-port="0" to-layer="2022" to-port="0" /> <edge from-layer="2022" from-port="1" to-layer="2023" to-port="1" /> <edge from-layer="2023" from-port="2" to-layer="2028" to-port="0" /> <edge from-layer="2024" from-port="0" to-layer="2027" to-port="1" /> <edge from-layer="2025" from-port="0" to-layer="2027" to-port="2" /> <edge from-layer="2026" from-port="0" to-layer="2027" to-port="3" /> <edge from-layer="2027" from-port="5" to-layer="2028" to-port="1" /> <edge from-layer="2028" from-port="2" to-layer="2029" to-port="0" /> <edge from-layer="2029" from-port="2" to-layer="2030" to-port="1" /> <edge from-layer="2030" from-port="2" to-layer="2084" to-port="0" /> <edge from-layer="2031" from-port="0" to-layer="2032" to-port="0" /> <edge from-layer="2032" from-port="1" to-layer="2037" to-port="0" /> <edge from-layer="2033" from-port="0" to-layer="2036" to-port="1" /> <edge from-layer="2034" from-port="0" to-layer="2036" to-port="2" /> <edge from-layer="2035" from-port="0" to-layer="2036" to-port="3" /> <edge from-layer="2036" from-port="4" to-layer="2037" to-port="1" /> <edge from-layer="2037" from-port="2" to-layer="2038" to-port="0" /> <edge from-layer="2038" from-port="1" to-layer="2040" to-port="0" /> <edge from-layer="2039" from-port="0" to-layer="2040" to-port="2" /> <edge from-layer="2040" from-port="3" to-layer="2064" to-port="0" /> <edge from-layer="2041" from-port="0" to-layer="2044" to-port="1" /> <edge from-layer="2042" from-port="0" to-layer="2044" to-port="2" /> <edge from-layer="2043" from-port="0" to-layer="2044" to-port="3" /> <edge from-layer="2044" from-port="5" to-layer="2046" to-port="0" /> <edge from-layer="2045" from-port="0" to-layer="2046" to-port="1" /> <edge from-layer="2046" from-port="2" to-layer="2048" to-port="0" /> <edge from-layer="2047" from-port="0" to-layer="2048" to-port="1" /> <edge from-layer="2048" from-port="2" to-layer="2049" to-port="0" /> <edge from-layer="2048" from-port="2" to-layer="2053" to-port="0" /> <edge from-layer="2048" from-port="2" to-layer="2060" to-port="0" /> <edge from-layer="2049" from-port="2" to-layer="2063" to-port="0" /> <edge from-layer="2050" from-port="0" to-layer="2053" to-port="1" /> <edge from-layer="2051" from-port="0" to-layer="2053" to-port="2" /> <edge from-layer="2052" from-port="0" to-layer="2053" to-port="3" /> <edge from-layer="2053" from-port="5" to-layer="2056" to-port="0" /> <edge from-layer="2054" from-port="0" to-layer="2055" to-port="0" /> <edge from-layer="2055" from-port="1" to-layer="2056" to-port="1" /> <edge from-layer="2056" from-port="2" to-layer="2061" to-port="0" /> <edge from-layer="2057" from-port="0" to-layer="2060" to-port="1" /> <edge from-layer="2058" from-port="0" to-layer="2060" to-port="2" /> <edge from-layer="2059" from-port="0" to-layer="2060" to-port="3" /> <edge from-layer="2060" from-port="5" to-layer="2061" to-port="1" /> <edge from-layer="2061" from-port="2" to-layer="2062" to-port="0" /> <edge from-layer="2062" from-port="2" to-layer="2063" to-port="1" /> <edge from-layer="2063" from-port="2" to-layer="2064" to-port="1" /> <edge from-layer="2064" from-port="2" to-layer="2084" to-port="1" /> <edge from-layer="2064" from-port="2" to-layer="4298" to-port="0" /> <edge from-layer="2065" from-port="0" to-layer="2066" to-port="0" /> <edge from-layer="2066" from-port="1" to-layer="2071" to-port="0" /> <edge from-layer="2067" from-port="0" to-layer="2070" to-port="1" /> <edge from-layer="2068" from-port="0" to-layer="2070" to-port="2" /> <edge from-layer="2069" from-port="0" to-layer="2070" to-port="3" /> <edge from-layer="2070" from-port="4" to-layer="2071" to-port="1" /> <edge from-layer="2071" from-port="2" to-layer="2072" to-port="0" /> <edge from-layer="2072" from-port="1" to-layer="2074" to-port="0" /> <edge from-layer="2073" from-port="0" to-layer="2074" to-port="2" /> <edge from-layer="2074" from-port="3" to-layer="2083" to-port="0" /> <edge from-layer="2075" from-port="0" to-layer="2078" to-port="1" /> <edge from-layer="2076" from-port="0" to-layer="2078" to-port="2" /> <edge from-layer="2077" from-port="0" to-layer="2078" to-port="3" /> <edge from-layer="2078" from-port="5" to-layer="2080" to-port="0" /> <edge from-layer="2079" from-port="0" to-layer="2080" to-port="1" /> <edge from-layer="2080" from-port="2" to-layer="2082" to-port="0" /> <edge from-layer="2081" from-port="0" to-layer="2082" to-port="1" /> <edge from-layer="2082" from-port="2" to-layer="2083" to-port="1" /> <edge from-layer="2083" from-port="2" to-layer="2084" to-port="2" /> <edge from-layer="2083" from-port="2" to-layer="4297" to-port="0" /> <edge from-layer="2084" from-port="4" to-layer="2086" to-port="0" /> <edge from-layer="2085" from-port="0" to-layer="2086" to-port="1" /> <edge from-layer="2086" from-port="2" to-layer="2088" to-port="0" /> <edge from-layer="2087" from-port="0" to-layer="2088" to-port="1" /> <edge from-layer="2088" from-port="2" to-layer="2091" to-port="0" /> <edge from-layer="2089" from-port="0" to-layer="2090" to-port="0" /> <edge from-layer="2090" from-port="1" to-layer="2091" to-port="1" /> <edge from-layer="2091" from-port="2" to-layer="2092" to-port="1" /> <edge from-layer="2092" from-port="2" to-layer="2118" to-port="0" /> <edge from-layer="2092" from-port="2" to-layer="2107" to-port="0" /> <edge from-layer="2092" from-port="2" to-layer="2099" to-port="0" /> <edge from-layer="2093" from-port="0" to-layer="2094" to-port="0" /> <edge from-layer="2094" from-port="1" to-layer="2108" to-port="0" /> <edge from-layer="2095" from-port="0" to-layer="2096" to-port="0" /> <edge from-layer="2096" from-port="1" to-layer="2106" to-port="0" /> <edge from-layer="2097" from-port="0" to-layer="2098" to-port="0" /> <edge from-layer="2098" from-port="1" to-layer="2099" to-port="1" /> <edge from-layer="2099" from-port="2" to-layer="2101" to-port="0" /> <edge from-layer="2100" from-port="0" to-layer="2101" to-port="1" /> <edge from-layer="2101" from-port="2" to-layer="2104" to-port="0" /> <edge from-layer="2102" from-port="0" to-layer="2103" to-port="0" /> <edge from-layer="2103" from-port="1" to-layer="2104" to-port="1" /> <edge from-layer="2104" from-port="2" to-layer="2105" to-port="0" /> <edge from-layer="2105" from-port="1" to-layer="2106" to-port="1" /> <edge from-layer="2106" from-port="2" to-layer="2107" to-port="1" /> <edge from-layer="2107" from-port="2" to-layer="2108" to-port="1" /> <edge from-layer="2108" from-port="2" to-layer="2111" to-port="0" /> <edge from-layer="2109" from-port="0" to-layer="2110" to-port="0" /> <edge from-layer="2110" from-port="1" to-layer="2111" to-port="1" /> <edge from-layer="2111" from-port="2" to-layer="2112" to-port="0" /> <edge from-layer="2112" from-port="4" to-layer="2114" to-port="0" /> <edge from-layer="2112" from-port="3" to-layer="2113" to-port="0" /> <edge from-layer="2113" from-port="1" to-layer="2114" to-port="1" /> <edge from-layer="2114" from-port="2" to-layer="2117" to-port="0" /> <edge from-layer="2115" from-port="0" to-layer="2116" to-port="0" /> <edge from-layer="2116" from-port="1" to-layer="2117" to-port="1" /> <edge from-layer="2117" from-port="2" to-layer="2118" to-port="1" /> <edge from-layer="2118" from-port="2" to-layer="2125" to-port="0" /> <edge from-layer="2118" from-port="2" to-layer="2222" to-port="0" /> <edge from-layer="2118" from-port="2" to-layer="2133" to-port="0" /> <edge from-layer="2119" from-port="0" to-layer="2120" to-port="0" /> <edge from-layer="2120" from-port="1" to-layer="2134" to-port="0" /> <edge from-layer="2121" from-port="0" to-layer="2122" to-port="0" /> <edge from-layer="2122" from-port="1" to-layer="2132" to-port="0" /> <edge from-layer="2123" from-port="0" to-layer="2124" to-port="0" /> <edge from-layer="2124" from-port="1" to-layer="2125" to-port="1" /> <edge from-layer="2125" from-port="2" to-layer="2127" to-port="0" /> <edge from-layer="2126" from-port="0" to-layer="2127" to-port="1" /> <edge from-layer="2127" from-port="2" to-layer="2130" to-port="0" /> <edge from-layer="2128" from-port="0" to-layer="2129" to-port="0" /> <edge from-layer="2129" from-port="1" to-layer="2130" to-port="1" /> <edge from-layer="2130" from-port="2" to-layer="2131" to-port="0" /> <edge from-layer="2131" from-port="1" to-layer="2132" to-port="1" /> <edge from-layer="2132" from-port="2" to-layer="2133" to-port="1" /> <edge from-layer="2133" from-port="2" to-layer="2134" to-port="1" /> <edge from-layer="2134" from-port="2" to-layer="2137" to-port="0" /> <edge from-layer="2135" from-port="0" to-layer="2136" to-port="0" /> <edge from-layer="2136" from-port="1" to-layer="2137" to-port="1" /> <edge from-layer="2137" from-port="2" to-layer="2141" to-port="0" /> <edge from-layer="2137" from-port="2" to-layer="2208" to-port="0" /> <edge from-layer="2137" from-port="2" to-layer="2174" to-port="0" /> <edge from-layer="2138" from-port="0" to-layer="2141" to-port="1" /> <edge from-layer="2139" from-port="0" to-layer="2141" to-port="2" /> <edge from-layer="2140" from-port="0" to-layer="2141" to-port="3" /> <edge from-layer="2141" from-port="5" to-layer="2143" to-port="0" /> <edge from-layer="2142" from-port="0" to-layer="2143" to-port="1" /> <edge from-layer="2143" from-port="2" to-layer="2145" to-port="0" /> <edge from-layer="2144" from-port="0" to-layer="2145" to-port="1" /> <edge from-layer="2145" from-port="2" to-layer="2157" to-port="0" /> <edge from-layer="2145" from-port="2" to-layer="2146" to-port="0" /> <edge from-layer="2145" from-port="2" to-layer="2150" to-port="0" /> <edge from-layer="2146" from-port="2" to-layer="2160" to-port="0" /> <edge from-layer="2147" from-port="0" to-layer="2150" to-port="1" /> <edge from-layer="2148" from-port="0" to-layer="2150" to-port="2" /> <edge from-layer="2149" from-port="0" to-layer="2150" to-port="3" /> <edge from-layer="2150" from-port="5" to-layer="2153" to-port="0" /> <edge from-layer="2151" from-port="0" to-layer="2152" to-port="0" /> <edge from-layer="2152" from-port="1" to-layer="2153" to-port="1" /> <edge from-layer="2153" from-port="2" to-layer="2158" to-port="0" /> <edge from-layer="2154" from-port="0" to-layer="2157" to-port="1" /> <edge from-layer="2155" from-port="0" to-layer="2157" to-port="2" /> <edge from-layer="2156" from-port="0" to-layer="2157" to-port="3" /> <edge from-layer="2157" from-port="5" to-layer="2158" to-port="1" /> <edge from-layer="2158" from-port="2" to-layer="2159" to-port="0" /> <edge from-layer="2159" from-port="2" to-layer="2160" to-port="1" /> <edge from-layer="2160" from-port="2" to-layer="2214" to-port="0" /> <edge from-layer="2161" from-port="0" to-layer="2162" to-port="0" /> <edge from-layer="2162" from-port="1" to-layer="2167" to-port="0" /> <edge from-layer="2163" from-port="0" to-layer="2166" to-port="1" /> <edge from-layer="2164" from-port="0" to-layer="2166" to-port="2" /> <edge from-layer="2165" from-port="0" to-layer="2166" to-port="3" /> <edge from-layer="2166" from-port="4" to-layer="2167" to-port="1" /> <edge from-layer="2167" from-port="2" to-layer="2168" to-port="0" /> <edge from-layer="2168" from-port="1" to-layer="2170" to-port="0" /> <edge from-layer="2169" from-port="0" to-layer="2170" to-port="2" /> <edge from-layer="2170" from-port="3" to-layer="2194" to-port="0" /> <edge from-layer="2171" from-port="0" to-layer="2174" to-port="1" /> <edge from-layer="2172" from-port="0" to-layer="2174" to-port="2" /> <edge from-layer="2173" from-port="0" to-layer="2174" to-port="3" /> <edge from-layer="2174" from-port="5" to-layer="2176" to-port="0" /> <edge from-layer="2175" from-port="0" to-layer="2176" to-port="1" /> <edge from-layer="2176" from-port="2" to-layer="2178" to-port="0" /> <edge from-layer="2177" from-port="0" to-layer="2178" to-port="1" /> <edge from-layer="2178" from-port="2" to-layer="2179" to-port="0" /> <edge from-layer="2178" from-port="2" to-layer="2190" to-port="0" /> <edge from-layer="2178" from-port="2" to-layer="2183" to-port="0" /> <edge from-layer="2179" from-port="2" to-layer="2193" to-port="0" /> <edge from-layer="2180" from-port="0" to-layer="2183" to-port="1" /> <edge from-layer="2181" from-port="0" to-layer="2183" to-port="2" /> <edge from-layer="2182" from-port="0" to-layer="2183" to-port="3" /> <edge from-layer="2183" from-port="5" to-layer="2186" to-port="0" /> <edge from-layer="2184" from-port="0" to-layer="2185" to-port="0" /> <edge from-layer="2185" from-port="1" to-layer="2186" to-port="1" /> <edge from-layer="2186" from-port="2" to-layer="2191" to-port="0" /> <edge from-layer="2187" from-port="0" to-layer="2190" to-port="1" /> <edge from-layer="2188" from-port="0" to-layer="2190" to-port="2" /> <edge from-layer="2189" from-port="0" to-layer="2190" to-port="3" /> <edge from-layer="2190" from-port="5" to-layer="2191" to-port="1" /> <edge from-layer="2191" from-port="2" to-layer="2192" to-port="0" /> <edge from-layer="2192" from-port="2" to-layer="2193" to-port="1" /> <edge from-layer="2193" from-port="2" to-layer="2194" to-port="1" /> <edge from-layer="2194" from-port="2" to-layer="4296" to-port="0" /> <edge from-layer="2194" from-port="2" to-layer="2214" to-port="1" /> <edge from-layer="2195" from-port="0" to-layer="2196" to-port="0" /> <edge from-layer="2196" from-port="1" to-layer="2201" to-port="0" /> <edge from-layer="2197" from-port="0" to-layer="2200" to-port="1" /> <edge from-layer="2198" from-port="0" to-layer="2200" to-port="2" /> <edge from-layer="2199" from-port="0" to-layer="2200" to-port="3" /> <edge from-layer="2200" from-port="4" to-layer="2201" to-port="1" /> <edge from-layer="2201" from-port="2" to-layer="2202" to-port="0" /> <edge from-layer="2202" from-port="1" to-layer="2204" to-port="0" /> <edge from-layer="2203" from-port="0" to-layer="2204" to-port="2" /> <edge from-layer="2204" from-port="3" to-layer="2213" to-port="0" /> <edge from-layer="2205" from-port="0" to-layer="2208" to-port="1" /> <edge from-layer="2206" from-port="0" to-layer="2208" to-port="2" /> <edge from-layer="2207" from-port="0" to-layer="2208" to-port="3" /> <edge from-layer="2208" from-port="5" to-layer="2210" to-port="0" /> <edge from-layer="2209" from-port="0" to-layer="2210" to-port="1" /> <edge from-layer="2210" from-port="2" to-layer="2212" to-port="0" /> <edge from-layer="2211" from-port="0" to-layer="2212" to-port="1" /> <edge from-layer="2212" from-port="2" to-layer="2213" to-port="1" /> <edge from-layer="2213" from-port="2" to-layer="4295" to-port="0" /> <edge from-layer="2213" from-port="2" to-layer="2214" to-port="2" /> <edge from-layer="2214" from-port="4" to-layer="2216" to-port="0" /> <edge from-layer="2215" from-port="0" to-layer="2216" to-port="1" /> <edge from-layer="2216" from-port="2" to-layer="2218" to-port="0" /> <edge from-layer="2217" from-port="0" to-layer="2218" to-port="1" /> <edge from-layer="2218" from-port="2" to-layer="2221" to-port="0" /> <edge from-layer="2219" from-port="0" to-layer="2220" to-port="0" /> <edge from-layer="2220" from-port="1" to-layer="2221" to-port="1" /> <edge from-layer="2221" from-port="2" to-layer="2222" to-port="1" /> <edge from-layer="2222" from-port="2" to-layer="2237" to-port="0" /> <edge from-layer="2222" from-port="2" to-layer="2229" to-port="0" /> <edge from-layer="2222" from-port="2" to-layer="2248" to-port="0" /> <edge from-layer="2223" from-port="0" to-layer="2224" to-port="0" /> <edge from-layer="2224" from-port="1" to-layer="2238" to-port="0" /> <edge from-layer="2225" from-port="0" to-layer="2226" to-port="0" /> <edge from-layer="2226" from-port="1" to-layer="2236" to-port="0" /> <edge from-layer="2227" from-port="0" to-layer="2228" to-port="0" /> <edge from-layer="2228" from-port="1" to-layer="2229" to-port="1" /> <edge from-layer="2229" from-port="2" to-layer="2231" to-port="0" /> <edge from-layer="2230" from-port="0" to-layer="2231" to-port="1" /> <edge from-layer="2231" from-port="2" to-layer="2234" to-port="0" /> <edge from-layer="2232" from-port="0" to-layer="2233" to-port="0" /> <edge from-layer="2233" from-port="1" to-layer="2234" to-port="1" /> <edge from-layer="2234" from-port="2" to-layer="2235" to-port="0" /> <edge from-layer="2235" from-port="1" to-layer="2236" to-port="1" /> <edge from-layer="2236" from-port="2" to-layer="2237" to-port="1" /> <edge from-layer="2237" from-port="2" to-layer="2238" to-port="1" /> <edge from-layer="2238" from-port="2" to-layer="2241" to-port="0" /> <edge from-layer="2239" from-port="0" to-layer="2240" to-port="0" /> <edge from-layer="2240" from-port="1" to-layer="2241" to-port="1" /> <edge from-layer="2241" from-port="2" to-layer="2242" to-port="0" /> <edge from-layer="2242" from-port="4" to-layer="2244" to-port="0" /> <edge from-layer="2242" from-port="3" to-layer="2243" to-port="0" /> <edge from-layer="2243" from-port="1" to-layer="2244" to-port="1" /> <edge from-layer="2244" from-port="2" to-layer="2247" to-port="0" /> <edge from-layer="2245" from-port="0" to-layer="2246" to-port="0" /> <edge from-layer="2246" from-port="1" to-layer="2247" to-port="1" /> <edge from-layer="2247" from-port="2" to-layer="2248" to-port="1" /> <edge from-layer="2248" from-port="2" to-layer="2352" to-port="0" /> <edge from-layer="2248" from-port="2" to-layer="2263" to-port="0" /> <edge from-layer="2248" from-port="2" to-layer="2255" to-port="0" /> <edge from-layer="2249" from-port="0" to-layer="2250" to-port="0" /> <edge from-layer="2250" from-port="1" to-layer="2264" to-port="0" /> <edge from-layer="2251" from-port="0" to-layer="2252" to-port="0" /> <edge from-layer="2252" from-port="1" to-layer="2262" to-port="0" /> <edge from-layer="2253" from-port="0" to-layer="2254" to-port="0" /> <edge from-layer="2254" from-port="1" to-layer="2255" to-port="1" /> <edge from-layer="2255" from-port="2" to-layer="2257" to-port="0" /> <edge from-layer="2256" from-port="0" to-layer="2257" to-port="1" /> <edge from-layer="2257" from-port="2" to-layer="2260" to-port="0" /> <edge from-layer="2258" from-port="0" to-layer="2259" to-port="0" /> <edge from-layer="2259" from-port="1" to-layer="2260" to-port="1" /> <edge from-layer="2260" from-port="2" to-layer="2261" to-port="0" /> <edge from-layer="2261" from-port="1" to-layer="2262" to-port="1" /> <edge from-layer="2262" from-port="2" to-layer="2263" to-port="1" /> <edge from-layer="2263" from-port="2" to-layer="2264" to-port="1" /> <edge from-layer="2264" from-port="2" to-layer="2267" to-port="0" /> <edge from-layer="2265" from-port="0" to-layer="2266" to-port="0" /> <edge from-layer="2266" from-port="1" to-layer="2267" to-port="1" /> <edge from-layer="2267" from-port="2" to-layer="2271" to-port="0" /> <edge from-layer="2267" from-port="2" to-layer="2304" to-port="0" /> <edge from-layer="2267" from-port="2" to-layer="2338" to-port="0" /> <edge from-layer="2268" from-port="0" to-layer="2271" to-port="1" /> <edge from-layer="2269" from-port="0" to-layer="2271" to-port="2" /> <edge from-layer="2270" from-port="0" to-layer="2271" to-port="3" /> <edge from-layer="2271" from-port="5" to-layer="2273" to-port="0" /> <edge from-layer="2272" from-port="0" to-layer="2273" to-port="1" /> <edge from-layer="2273" from-port="2" to-layer="2275" to-port="0" /> <edge from-layer="2274" from-port="0" to-layer="2275" to-port="1" /> <edge from-layer="2275" from-port="2" to-layer="2287" to-port="0" /> <edge from-layer="2275" from-port="2" to-layer="2276" to-port="0" /> <edge from-layer="2275" from-port="2" to-layer="2280" to-port="0" /> <edge from-layer="2276" from-port="2" to-layer="2290" to-port="0" /> <edge from-layer="2277" from-port="0" to-layer="2280" to-port="1" /> <edge from-layer="2278" from-port="0" to-layer="2280" to-port="2" /> <edge from-layer="2279" from-port="0" to-layer="2280" to-port="3" /> <edge from-layer="2280" from-port="5" to-layer="2283" to-port="0" /> <edge from-layer="2281" from-port="0" to-layer="2282" to-port="0" /> <edge from-layer="2282" from-port="1" to-layer="2283" to-port="1" /> <edge from-layer="2283" from-port="2" to-layer="2288" to-port="0" /> <edge from-layer="2284" from-port="0" to-layer="2287" to-port="1" /> <edge from-layer="2285" from-port="0" to-layer="2287" to-port="2" /> <edge from-layer="2286" from-port="0" to-layer="2287" to-port="3" /> <edge from-layer="2287" from-port="5" to-layer="2288" to-port="1" /> <edge from-layer="2288" from-port="2" to-layer="2289" to-port="0" /> <edge from-layer="2289" from-port="2" to-layer="2290" to-port="1" /> <edge from-layer="2290" from-port="2" to-layer="2344" to-port="0" /> <edge from-layer="2291" from-port="0" to-layer="2292" to-port="0" /> <edge from-layer="2292" from-port="1" to-layer="2297" to-port="0" /> <edge from-layer="2293" from-port="0" to-layer="2296" to-port="1" /> <edge from-layer="2294" from-port="0" to-layer="2296" to-port="2" /> <edge from-layer="2295" from-port="0" to-layer="2296" to-port="3" /> <edge from-layer="2296" from-port="4" to-layer="2297" to-port="1" /> <edge from-layer="2297" from-port="2" to-layer="2298" to-port="0" /> <edge from-layer="2298" from-port="1" to-layer="2300" to-port="0" /> <edge from-layer="2299" from-port="0" to-layer="2300" to-port="2" /> <edge from-layer="2300" from-port="3" to-layer="2324" to-port="0" /> <edge from-layer="2301" from-port="0" to-layer="2304" to-port="1" /> <edge from-layer="2302" from-port="0" to-layer="2304" to-port="2" /> <edge from-layer="2303" from-port="0" to-layer="2304" to-port="3" /> <edge from-layer="2304" from-port="5" to-layer="2306" to-port="0" /> <edge from-layer="2305" from-port="0" to-layer="2306" to-port="1" /> <edge from-layer="2306" from-port="2" to-layer="2308" to-port="0" /> <edge from-layer="2307" from-port="0" to-layer="2308" to-port="1" /> <edge from-layer="2308" from-port="2" to-layer="2309" to-port="0" /> <edge from-layer="2308" from-port="2" to-layer="2313" to-port="0" /> <edge from-layer="2308" from-port="2" to-layer="2320" to-port="0" /> <edge from-layer="2309" from-port="2" to-layer="2323" to-port="0" /> <edge from-layer="2310" from-port="0" to-layer="2313" to-port="1" /> <edge from-layer="2311" from-port="0" to-layer="2313" to-port="2" /> <edge from-layer="2312" from-port="0" to-layer="2313" to-port="3" /> <edge from-layer="2313" from-port="5" to-layer="2316" to-port="0" /> <edge from-layer="2314" from-port="0" to-layer="2315" to-port="0" /> <edge from-layer="2315" from-port="1" to-layer="2316" to-port="1" /> <edge from-layer="2316" from-port="2" to-layer="2321" to-port="0" /> <edge from-layer="2317" from-port="0" to-layer="2320" to-port="1" /> <edge from-layer="2318" from-port="0" to-layer="2320" to-port="2" /> <edge from-layer="2319" from-port="0" to-layer="2320" to-port="3" /> <edge from-layer="2320" from-port="5" to-layer="2321" to-port="1" /> <edge from-layer="2321" from-port="2" to-layer="2322" to-port="0" /> <edge from-layer="2322" from-port="2" to-layer="2323" to-port="1" /> <edge from-layer="2323" from-port="2" to-layer="2324" to-port="1" /> <edge from-layer="2324" from-port="2" to-layer="2344" to-port="1" /> <edge from-layer="2324" from-port="2" to-layer="4294" to-port="0" /> <edge from-layer="2325" from-port="0" to-layer="2326" to-port="0" /> <edge from-layer="2326" from-port="1" to-layer="2331" to-port="0" /> <edge from-layer="2327" from-port="0" to-layer="2330" to-port="1" /> <edge from-layer="2328" from-port="0" to-layer="2330" to-port="2" /> <edge from-layer="2329" from-port="0" to-layer="2330" to-port="3" /> <edge from-layer="2330" from-port="4" to-layer="2331" to-port="1" /> <edge from-layer="2331" from-port="2" to-layer="2332" to-port="0" /> <edge from-layer="2332" from-port="1" to-layer="2334" to-port="0" /> <edge from-layer="2333" from-port="0" to-layer="2334" to-port="2" /> <edge from-layer="2334" from-port="3" to-layer="2343" to-port="0" /> <edge from-layer="2335" from-port="0" to-layer="2338" to-port="1" /> <edge from-layer="2336" from-port="0" to-layer="2338" to-port="2" /> <edge from-layer="2337" from-port="0" to-layer="2338" to-port="3" /> <edge from-layer="2338" from-port="5" to-layer="2340" to-port="0" /> <edge from-layer="2339" from-port="0" to-layer="2340" to-port="1" /> <edge from-layer="2340" from-port="2" to-layer="2342" to-port="0" /> <edge from-layer="2341" from-port="0" to-layer="2342" to-port="1" /> <edge from-layer="2342" from-port="2" to-layer="2343" to-port="1" /> <edge from-layer="2343" from-port="2" to-layer="4293" to-port="0" /> <edge from-layer="2343" from-port="2" to-layer="2344" to-port="2" /> <edge from-layer="2344" from-port="4" to-layer="2346" to-port="0" /> <edge from-layer="2345" from-port="0" to-layer="2346" to-port="1" /> <edge from-layer="2346" from-port="2" to-layer="2348" to-port="0" /> <edge from-layer="2347" from-port="0" to-layer="2348" to-port="1" /> <edge from-layer="2348" from-port="2" to-layer="2351" to-port="0" /> <edge from-layer="2349" from-port="0" to-layer="2350" to-port="0" /> <edge from-layer="2350" from-port="1" to-layer="2351" to-port="1" /> <edge from-layer="2351" from-port="2" to-layer="2352" to-port="1" /> <edge from-layer="2352" from-port="2" to-layer="2359" to-port="0" /> <edge from-layer="2352" from-port="2" to-layer="2378" to-port="0" /> <edge from-layer="2352" from-port="2" to-layer="2367" to-port="0" /> <edge from-layer="2353" from-port="0" to-layer="2354" to-port="0" /> <edge from-layer="2354" from-port="1" to-layer="2368" to-port="0" /> <edge from-layer="2355" from-port="0" to-layer="2356" to-port="0" /> <edge from-layer="2356" from-port="1" to-layer="2366" to-port="0" /> <edge from-layer="2357" from-port="0" to-layer="2358" to-port="0" /> <edge from-layer="2358" from-port="1" to-layer="2359" to-port="1" /> <edge from-layer="2359" from-port="2" to-layer="2361" to-port="0" /> <edge from-layer="2360" from-port="0" to-layer="2361" to-port="1" /> <edge from-layer="2361" from-port="2" to-layer="2364" to-port="0" /> <edge from-layer="2362" from-port="0" to-layer="2363" to-port="0" /> <edge from-layer="2363" from-port="1" to-layer="2364" to-port="1" /> <edge from-layer="2364" from-port="2" to-layer="2365" to-port="0" /> <edge from-layer="2365" from-port="1" to-layer="2366" to-port="1" /> <edge from-layer="2366" from-port="2" to-layer="2367" to-port="1" /> <edge from-layer="2367" from-port="2" to-layer="2368" to-port="1" /> <edge from-layer="2368" from-port="2" to-layer="2371" to-port="0" /> <edge from-layer="2369" from-port="0" to-layer="2370" to-port="0" /> <edge from-layer="2370" from-port="1" to-layer="2371" to-port="1" /> <edge from-layer="2371" from-port="2" to-layer="2372" to-port="0" /> <edge from-layer="2372" from-port="4" to-layer="2374" to-port="0" /> <edge from-layer="2372" from-port="3" to-layer="2373" to-port="0" /> <edge from-layer="2373" from-port="1" to-layer="2374" to-port="1" /> <edge from-layer="2374" from-port="2" to-layer="2377" to-port="0" /> <edge from-layer="2375" from-port="0" to-layer="2376" to-port="0" /> <edge from-layer="2376" from-port="1" to-layer="2377" to-port="1" /> <edge from-layer="2377" from-port="2" to-layer="2378" to-port="1" /> <edge from-layer="2378" from-port="2" to-layer="2482" to-port="0" /> <edge from-layer="2378" from-port="2" to-layer="2393" to-port="0" /> <edge from-layer="2378" from-port="2" to-layer="2385" to-port="0" /> <edge from-layer="2379" from-port="0" to-layer="2380" to-port="0" /> <edge from-layer="2380" from-port="1" to-layer="2394" to-port="0" /> <edge from-layer="2381" from-port="0" to-layer="2382" to-port="0" /> <edge from-layer="2382" from-port="1" to-layer="2392" to-port="0" /> <edge from-layer="2383" from-port="0" to-layer="2384" to-port="0" /> <edge from-layer="2384" from-port="1" to-layer="2385" to-port="1" /> <edge from-layer="2385" from-port="2" to-layer="2387" to-port="0" /> <edge from-layer="2386" from-port="0" to-layer="2387" to-port="1" /> <edge from-layer="2387" from-port="2" to-layer="2390" to-port="0" /> <edge from-layer="2388" from-port="0" to-layer="2389" to-port="0" /> <edge from-layer="2389" from-port="1" to-layer="2390" to-port="1" /> <edge from-layer="2390" from-port="2" to-layer="2391" to-port="0" /> <edge from-layer="2391" from-port="1" to-layer="2392" to-port="1" /> <edge from-layer="2392" from-port="2" to-layer="2393" to-port="1" /> <edge from-layer="2393" from-port="2" to-layer="2394" to-port="1" /> <edge from-layer="2394" from-port="2" to-layer="2397" to-port="0" /> <edge from-layer="2395" from-port="0" to-layer="2396" to-port="0" /> <edge from-layer="2396" from-port="1" to-layer="2397" to-port="1" /> <edge from-layer="2397" from-port="2" to-layer="2401" to-port="0" /> <edge from-layer="2397" from-port="2" to-layer="2468" to-port="0" /> <edge from-layer="2397" from-port="2" to-layer="2434" to-port="0" /> <edge from-layer="2398" from-port="0" to-layer="2401" to-port="1" /> <edge from-layer="2399" from-port="0" to-layer="2401" to-port="2" /> <edge from-layer="2400" from-port="0" to-layer="2401" to-port="3" /> <edge from-layer="2401" from-port="5" to-layer="2403" to-port="0" /> <edge from-layer="2402" from-port="0" to-layer="2403" to-port="1" /> <edge from-layer="2403" from-port="2" to-layer="2405" to-port="0" /> <edge from-layer="2404" from-port="0" to-layer="2405" to-port="1" /> <edge from-layer="2405" from-port="2" to-layer="2410" to-port="0" /> <edge from-layer="2405" from-port="2" to-layer="2406" to-port="0" /> <edge from-layer="2405" from-port="2" to-layer="2417" to-port="0" /> <edge from-layer="2406" from-port="2" to-layer="2420" to-port="0" /> <edge from-layer="2407" from-port="0" to-layer="2410" to-port="1" /> <edge from-layer="2408" from-port="0" to-layer="2410" to-port="2" /> <edge from-layer="2409" from-port="0" to-layer="2410" to-port="3" /> <edge from-layer="2410" from-port="5" to-layer="2413" to-port="0" /> <edge from-layer="2411" from-port="0" to-layer="2412" to-port="0" /> <edge from-layer="2412" from-port="1" to-layer="2413" to-port="1" /> <edge from-layer="2413" from-port="2" to-layer="2418" to-port="0" /> <edge from-layer="2414" from-port="0" to-layer="2417" to-port="1" /> <edge from-layer="2415" from-port="0" to-layer="2417" to-port="2" /> <edge from-layer="2416" from-port="0" to-layer="2417" to-port="3" /> <edge from-layer="2417" from-port="5" to-layer="2418" to-port="1" /> <edge from-layer="2418" from-port="2" to-layer="2419" to-port="0" /> <edge from-layer="2419" from-port="2" to-layer="2420" to-port="1" /> <edge from-layer="2420" from-port="2" to-layer="2474" to-port="0" /> <edge from-layer="2421" from-port="0" to-layer="2422" to-port="0" /> <edge from-layer="2422" from-port="1" to-layer="2427" to-port="0" /> <edge from-layer="2423" from-port="0" to-layer="2426" to-port="1" /> <edge from-layer="2424" from-port="0" to-layer="2426" to-port="2" /> <edge from-layer="2425" from-port="0" to-layer="2426" to-port="3" /> <edge from-layer="2426" from-port="4" to-layer="2427" to-port="1" /> <edge from-layer="2427" from-port="2" to-layer="2428" to-port="0" /> <edge from-layer="2428" from-port="1" to-layer="2430" to-port="0" /> <edge from-layer="2429" from-port="0" to-layer="2430" to-port="2" /> <edge from-layer="2430" from-port="3" to-layer="2454" to-port="0" /> <edge from-layer="2431" from-port="0" to-layer="2434" to-port="1" /> <edge from-layer="2432" from-port="0" to-layer="2434" to-port="2" /> <edge from-layer="2433" from-port="0" to-layer="2434" to-port="3" /> <edge from-layer="2434" from-port="5" to-layer="2436" to-port="0" /> <edge from-layer="2435" from-port="0" to-layer="2436" to-port="1" /> <edge from-layer="2436" from-port="2" to-layer="2438" to-port="0" /> <edge from-layer="2437" from-port="0" to-layer="2438" to-port="1" /> <edge from-layer="2438" from-port="2" to-layer="2439" to-port="0" /> <edge from-layer="2438" from-port="2" to-layer="2443" to-port="0" /> <edge from-layer="2438" from-port="2" to-layer="2450" to-port="0" /> <edge from-layer="2439" from-port="2" to-layer="2453" to-port="0" /> <edge from-layer="2440" from-port="0" to-layer="2443" to-port="1" /> <edge from-layer="2441" from-port="0" to-layer="2443" to-port="2" /> <edge from-layer="2442" from-port="0" to-layer="2443" to-port="3" /> <edge from-layer="2443" from-port="5" to-layer="2446" to-port="0" /> <edge from-layer="2444" from-port="0" to-layer="2445" to-port="0" /> <edge from-layer="2445" from-port="1" to-layer="2446" to-port="1" /> <edge from-layer="2446" from-port="2" to-layer="2451" to-port="0" /> <edge from-layer="2447" from-port="0" to-layer="2450" to-port="1" /> <edge from-layer="2448" from-port="0" to-layer="2450" to-port="2" /> <edge from-layer="2449" from-port="0" to-layer="2450" to-port="3" /> <edge from-layer="2450" from-port="5" to-layer="2451" to-port="1" /> <edge from-layer="2451" from-port="2" to-layer="2452" to-port="0" /> <edge from-layer="2452" from-port="2" to-layer="2453" to-port="1" /> <edge from-layer="2453" from-port="2" to-layer="2454" to-port="1" /> <edge from-layer="2454" from-port="2" to-layer="2474" to-port="1" /> <edge from-layer="2454" from-port="2" to-layer="4292" to-port="0" /> <edge from-layer="2455" from-port="0" to-layer="2456" to-port="0" /> <edge from-layer="2456" from-port="1" to-layer="2461" to-port="0" /> <edge from-layer="2457" from-port="0" to-layer="2460" to-port="1" /> <edge from-layer="2458" from-port="0" to-layer="2460" to-port="2" /> <edge from-layer="2459" from-port="0" to-layer="2460" to-port="3" /> <edge from-layer="2460" from-port="4" to-layer="2461" to-port="1" /> <edge from-layer="2461" from-port="2" to-layer="2462" to-port="0" /> <edge from-layer="2462" from-port="1" to-layer="2464" to-port="0" /> <edge from-layer="2463" from-port="0" to-layer="2464" to-port="2" /> <edge from-layer="2464" from-port="3" to-layer="2473" to-port="0" /> <edge from-layer="2465" from-port="0" to-layer="2468" to-port="1" /> <edge from-layer="2466" from-port="0" to-layer="2468" to-port="2" /> <edge from-layer="2467" from-port="0" to-layer="2468" to-port="3" /> <edge from-layer="2468" from-port="5" to-layer="2470" to-port="0" /> <edge from-layer="2469" from-port="0" to-layer="2470" to-port="1" /> <edge from-layer="2470" from-port="2" to-layer="2472" to-port="0" /> <edge from-layer="2471" from-port="0" to-layer="2472" to-port="1" /> <edge from-layer="2472" from-port="2" to-layer="2473" to-port="1" /> <edge from-layer="2473" from-port="2" to-layer="2474" to-port="2" /> <edge from-layer="2473" from-port="2" to-layer="4291" to-port="0" /> <edge from-layer="2474" from-port="4" to-layer="2476" to-port="0" /> <edge from-layer="2475" from-port="0" to-layer="2476" to-port="1" /> <edge from-layer="2476" from-port="2" to-layer="2478" to-port="0" /> <edge from-layer="2477" from-port="0" to-layer="2478" to-port="1" /> <edge from-layer="2478" from-port="2" to-layer="2481" to-port="0" /> <edge from-layer="2479" from-port="0" to-layer="2480" to-port="0" /> <edge from-layer="2480" from-port="1" to-layer="2481" to-port="1" /> <edge from-layer="2481" from-port="2" to-layer="2482" to-port="1" /> <edge from-layer="2482" from-port="2" to-layer="2489" to-port="0" /> <edge from-layer="2482" from-port="2" to-layer="2497" to-port="0" /> <edge from-layer="2482" from-port="2" to-layer="2508" to-port="0" /> <edge from-layer="2483" from-port="0" to-layer="2484" to-port="0" /> <edge from-layer="2484" from-port="1" to-layer="2498" to-port="0" /> <edge from-layer="2485" from-port="0" to-layer="2486" to-port="0" /> <edge from-layer="2486" from-port="1" to-layer="2496" to-port="0" /> <edge from-layer="2487" from-port="0" to-layer="2488" to-port="0" /> <edge from-layer="2488" from-port="1" to-layer="2489" to-port="1" /> <edge from-layer="2489" from-port="2" to-layer="2491" to-port="0" /> <edge from-layer="2490" from-port="0" to-layer="2491" to-port="1" /> <edge from-layer="2491" from-port="2" to-layer="2494" to-port="0" /> <edge from-layer="2492" from-port="0" to-layer="2493" to-port="0" /> <edge from-layer="2493" from-port="1" to-layer="2494" to-port="1" /> <edge from-layer="2494" from-port="2" to-layer="2495" to-port="0" /> <edge from-layer="2495" from-port="1" to-layer="2496" to-port="1" /> <edge from-layer="2496" from-port="2" to-layer="2497" to-port="1" /> <edge from-layer="2497" from-port="2" to-layer="2498" to-port="1" /> <edge from-layer="2498" from-port="2" to-layer="2501" to-port="0" /> <edge from-layer="2499" from-port="0" to-layer="2500" to-port="0" /> <edge from-layer="2500" from-port="1" to-layer="2501" to-port="1" /> <edge from-layer="2501" from-port="2" to-layer="2502" to-port="0" /> <edge from-layer="2502" from-port="4" to-layer="2504" to-port="0" /> <edge from-layer="2502" from-port="3" to-layer="2503" to-port="0" /> <edge from-layer="2503" from-port="1" to-layer="2504" to-port="1" /> <edge from-layer="2504" from-port="2" to-layer="2507" to-port="0" /> <edge from-layer="2505" from-port="0" to-layer="2506" to-port="0" /> <edge from-layer="2506" from-port="1" to-layer="2507" to-port="1" /> <edge from-layer="2507" from-port="2" to-layer="2508" to-port="1" /> <edge from-layer="2508" from-port="2" to-layer="2612" to-port="0" /> <edge from-layer="2508" from-port="2" to-layer="2523" to-port="0" /> <edge from-layer="2508" from-port="2" to-layer="2515" to-port="0" /> <edge from-layer="2509" from-port="0" to-layer="2510" to-port="0" /> <edge from-layer="2510" from-port="1" to-layer="2524" to-port="0" /> <edge from-layer="2511" from-port="0" to-layer="2512" to-port="0" /> <edge from-layer="2512" from-port="1" to-layer="2522" to-port="0" /> <edge from-layer="2513" from-port="0" to-layer="2514" to-port="0" /> <edge from-layer="2514" from-port="1" to-layer="2515" to-port="1" /> <edge from-layer="2515" from-port="2" to-layer="2517" to-port="0" /> <edge from-layer="2516" from-port="0" to-layer="2517" to-port="1" /> <edge from-layer="2517" from-port="2" to-layer="2520" to-port="0" /> <edge from-layer="2518" from-port="0" to-layer="2519" to-port="0" /> <edge from-layer="2519" from-port="1" to-layer="2520" to-port="1" /> <edge from-layer="2520" from-port="2" to-layer="2521" to-port="0" /> <edge from-layer="2521" from-port="1" to-layer="2522" to-port="1" /> <edge from-layer="2522" from-port="2" to-layer="2523" to-port="1" /> <edge from-layer="2523" from-port="2" to-layer="2524" to-port="1" /> <edge from-layer="2524" from-port="2" to-layer="2527" to-port="0" /> <edge from-layer="2525" from-port="0" to-layer="2526" to-port="0" /> <edge from-layer="2526" from-port="1" to-layer="2527" to-port="1" /> <edge from-layer="2527" from-port="2" to-layer="2598" to-port="0" /> <edge from-layer="2527" from-port="2" to-layer="2531" to-port="0" /> <edge from-layer="2527" from-port="2" to-layer="2564" to-port="0" /> <edge from-layer="2528" from-port="0" to-layer="2531" to-port="1" /> <edge from-layer="2529" from-port="0" to-layer="2531" to-port="2" /> <edge from-layer="2530" from-port="0" to-layer="2531" to-port="3" /> <edge from-layer="2531" from-port="5" to-layer="2533" to-port="0" /> <edge from-layer="2532" from-port="0" to-layer="2533" to-port="1" /> <edge from-layer="2533" from-port="2" to-layer="2535" to-port="0" /> <edge from-layer="2534" from-port="0" to-layer="2535" to-port="1" /> <edge from-layer="2535" from-port="2" to-layer="2536" to-port="0" /> <edge from-layer="2535" from-port="2" to-layer="2540" to-port="0" /> <edge from-layer="2535" from-port="2" to-layer="2547" to-port="0" /> <edge from-layer="2536" from-port="2" to-layer="2550" to-port="0" /> <edge from-layer="2537" from-port="0" to-layer="2540" to-port="1" /> <edge from-layer="2538" from-port="0" to-layer="2540" to-port="2" /> <edge from-layer="2539" from-port="0" to-layer="2540" to-port="3" /> <edge from-layer="2540" from-port="5" to-layer="2543" to-port="0" /> <edge from-layer="2541" from-port="0" to-layer="2542" to-port="0" /> <edge from-layer="2542" from-port="1" to-layer="2543" to-port="1" /> <edge from-layer="2543" from-port="2" to-layer="2548" to-port="0" /> <edge from-layer="2544" from-port="0" to-layer="2547" to-port="1" /> <edge from-layer="2545" from-port="0" to-layer="2547" to-port="2" /> <edge from-layer="2546" from-port="0" to-layer="2547" to-port="3" /> <edge from-layer="2547" from-port="5" to-layer="2548" to-port="1" /> <edge from-layer="2548" from-port="2" to-layer="2549" to-port="0" /> <edge from-layer="2549" from-port="2" to-layer="2550" to-port="1" /> <edge from-layer="2550" from-port="2" to-layer="2604" to-port="0" /> <edge from-layer="2551" from-port="0" to-layer="2552" to-port="0" /> <edge from-layer="2552" from-port="1" to-layer="2557" to-port="0" /> <edge from-layer="2553" from-port="0" to-layer="2556" to-port="1" /> <edge from-layer="2554" from-port="0" to-layer="2556" to-port="2" /> <edge from-layer="2555" from-port="0" to-layer="2556" to-port="3" /> <edge from-layer="2556" from-port="4" to-layer="2557" to-port="1" /> <edge from-layer="2557" from-port="2" to-layer="2558" to-port="0" /> <edge from-layer="2558" from-port="1" to-layer="2560" to-port="0" /> <edge from-layer="2559" from-port="0" to-layer="2560" to-port="2" /> <edge from-layer="2560" from-port="3" to-layer="2584" to-port="0" /> <edge from-layer="2561" from-port="0" to-layer="2564" to-port="1" /> <edge from-layer="2562" from-port="0" to-layer="2564" to-port="2" /> <edge from-layer="2563" from-port="0" to-layer="2564" to-port="3" /> <edge from-layer="2564" from-port="5" to-layer="2566" to-port="0" /> <edge from-layer="2565" from-port="0" to-layer="2566" to-port="1" /> <edge from-layer="2566" from-port="2" to-layer="2568" to-port="0" /> <edge from-layer="2567" from-port="0" to-layer="2568" to-port="1" /> <edge from-layer="2568" from-port="2" to-layer="2573" to-port="0" /> <edge from-layer="2568" from-port="2" to-layer="2569" to-port="0" /> <edge from-layer="2568" from-port="2" to-layer="2580" to-port="0" /> <edge from-layer="2569" from-port="2" to-layer="2583" to-port="0" /> <edge from-layer="2570" from-port="0" to-layer="2573" to-port="1" /> <edge from-layer="2571" from-port="0" to-layer="2573" to-port="2" /> <edge from-layer="2572" from-port="0" to-layer="2573" to-port="3" /> <edge from-layer="2573" from-port="5" to-layer="2576" to-port="0" /> <edge from-layer="2574" from-port="0" to-layer="2575" to-port="0" /> <edge from-layer="2575" from-port="1" to-layer="2576" to-port="1" /> <edge from-layer="2576" from-port="2" to-layer="2581" to-port="0" /> <edge from-layer="2577" from-port="0" to-layer="2580" to-port="1" /> <edge from-layer="2578" from-port="0" to-layer="2580" to-port="2" /> <edge from-layer="2579" from-port="0" to-layer="2580" to-port="3" /> <edge from-layer="2580" from-port="5" to-layer="2581" to-port="1" /> <edge from-layer="2581" from-port="2" to-layer="2582" to-port="0" /> <edge from-layer="2582" from-port="2" to-layer="2583" to-port="1" /> <edge from-layer="2583" from-port="2" to-layer="2584" to-port="1" /> <edge from-layer="2584" from-port="2" to-layer="4290" to-port="0" /> <edge from-layer="2584" from-port="2" to-layer="2604" to-port="1" /> <edge from-layer="2585" from-port="0" to-layer="2586" to-port="0" /> <edge from-layer="2586" from-port="1" to-layer="2591" to-port="0" /> <edge from-layer="2587" from-port="0" to-layer="2590" to-port="1" /> <edge from-layer="2588" from-port="0" to-layer="2590" to-port="2" /> <edge from-layer="2589" from-port="0" to-layer="2590" to-port="3" /> <edge from-layer="2590" from-port="4" to-layer="2591" to-port="1" /> <edge from-layer="2591" from-port="2" to-layer="2592" to-port="0" /> <edge from-layer="2592" from-port="1" to-layer="2594" to-port="0" /> <edge from-layer="2593" from-port="0" to-layer="2594" to-port="2" /> <edge from-layer="2594" from-port="3" to-layer="2603" to-port="0" /> <edge from-layer="2595" from-port="0" to-layer="2598" to-port="1" /> <edge from-layer="2596" from-port="0" to-layer="2598" to-port="2" /> <edge from-layer="2597" from-port="0" to-layer="2598" to-port="3" /> <edge from-layer="2598" from-port="5" to-layer="2600" to-port="0" /> <edge from-layer="2599" from-port="0" to-layer="2600" to-port="1" /> <edge from-layer="2600" from-port="2" to-layer="2602" to-port="0" /> <edge from-layer="2601" from-port="0" to-layer="2602" to-port="1" /> <edge from-layer="2602" from-port="2" to-layer="2603" to-port="1" /> <edge from-layer="2603" from-port="2" to-layer="2604" to-port="2" /> <edge from-layer="2603" from-port="2" to-layer="4289" to-port="0" /> <edge from-layer="2604" from-port="4" to-layer="2606" to-port="0" /> <edge from-layer="2605" from-port="0" to-layer="2606" to-port="1" /> <edge from-layer="2606" from-port="2" to-layer="2608" to-port="0" /> <edge from-layer="2607" from-port="0" to-layer="2608" to-port="1" /> <edge from-layer="2608" from-port="2" to-layer="2611" to-port="0" /> <edge from-layer="2609" from-port="0" to-layer="2610" to-port="0" /> <edge from-layer="2610" from-port="1" to-layer="2611" to-port="1" /> <edge from-layer="2611" from-port="2" to-layer="2612" to-port="1" /> <edge from-layer="2612" from-port="2" to-layer="2638" to-port="0" /> <edge from-layer="2612" from-port="2" to-layer="2619" to-port="0" /> <edge from-layer="2612" from-port="2" to-layer="2627" to-port="0" /> <edge from-layer="2613" from-port="0" to-layer="2614" to-port="0" /> <edge from-layer="2614" from-port="1" to-layer="2628" to-port="0" /> <edge from-layer="2615" from-port="0" to-layer="2616" to-port="0" /> <edge from-layer="2616" from-port="1" to-layer="2626" to-port="0" /> <edge from-layer="2617" from-port="0" to-layer="2618" to-port="0" /> <edge from-layer="2618" from-port="1" to-layer="2619" to-port="1" /> <edge from-layer="2619" from-port="2" to-layer="2621" to-port="0" /> <edge from-layer="2620" from-port="0" to-layer="2621" to-port="1" /> <edge from-layer="2621" from-port="2" to-layer="2624" to-port="0" /> <edge from-layer="2622" from-port="0" to-layer="2623" to-port="0" /> <edge from-layer="2623" from-port="1" to-layer="2624" to-port="1" /> <edge from-layer="2624" from-port="2" to-layer="2625" to-port="0" /> <edge from-layer="2625" from-port="1" to-layer="2626" to-port="1" /> <edge from-layer="2626" from-port="2" to-layer="2627" to-port="1" /> <edge from-layer="2627" from-port="2" to-layer="2628" to-port="1" /> <edge from-layer="2628" from-port="2" to-layer="2631" to-port="0" /> <edge from-layer="2629" from-port="0" to-layer="2630" to-port="0" /> <edge from-layer="2630" from-port="1" to-layer="2631" to-port="1" /> <edge from-layer="2631" from-port="2" to-layer="2632" to-port="0" /> <edge from-layer="2632" from-port="3" to-layer="2633" to-port="0" /> <edge from-layer="2632" from-port="4" to-layer="2634" to-port="0" /> <edge from-layer="2633" from-port="1" to-layer="2634" to-port="1" /> <edge from-layer="2634" from-port="2" to-layer="2637" to-port="0" /> <edge from-layer="2635" from-port="0" to-layer="2636" to-port="0" /> <edge from-layer="2636" from-port="1" to-layer="2637" to-port="1" /> <edge from-layer="2637" from-port="2" to-layer="2638" to-port="1" /> <edge from-layer="2638" from-port="2" to-layer="2645" to-port="0" /> <edge from-layer="2638" from-port="2" to-layer="2742" to-port="0" /> <edge from-layer="2638" from-port="2" to-layer="2653" to-port="0" /> <edge from-layer="2639" from-port="0" to-layer="2640" to-port="0" /> <edge from-layer="2640" from-port="1" to-layer="2654" to-port="0" /> <edge from-layer="2641" from-port="0" to-layer="2642" to-port="0" /> <edge from-layer="2642" from-port="1" to-layer="2652" to-port="0" /> <edge from-layer="2643" from-port="0" to-layer="2644" to-port="0" /> <edge from-layer="2644" from-port="1" to-layer="2645" to-port="1" /> <edge from-layer="2645" from-port="2" to-layer="2647" to-port="0" /> <edge from-layer="2646" from-port="0" to-layer="2647" to-port="1" /> <edge from-layer="2647" from-port="2" to-layer="2650" to-port="0" /> <edge from-layer="2648" from-port="0" to-layer="2649" to-port="0" /> <edge from-layer="2649" from-port="1" to-layer="2650" to-port="1" /> <edge from-layer="2650" from-port="2" to-layer="2651" to-port="0" /> <edge from-layer="2651" from-port="1" to-layer="2652" to-port="1" /> <edge from-layer="2652" from-port="2" to-layer="2653" to-port="1" /> <edge from-layer="2653" from-port="2" to-layer="2654" to-port="1" /> <edge from-layer="2654" from-port="2" to-layer="2657" to-port="0" /> <edge from-layer="2655" from-port="0" to-layer="2656" to-port="0" /> <edge from-layer="2656" from-port="1" to-layer="2657" to-port="1" /> <edge from-layer="2657" from-port="2" to-layer="2728" to-port="0" /> <edge from-layer="2657" from-port="2" to-layer="2694" to-port="0" /> <edge from-layer="2657" from-port="2" to-layer="2661" to-port="0" /> <edge from-layer="2658" from-port="0" to-layer="2661" to-port="1" /> <edge from-layer="2659" from-port="0" to-layer="2661" to-port="2" /> <edge from-layer="2660" from-port="0" to-layer="2661" to-port="3" /> <edge from-layer="2661" from-port="5" to-layer="2663" to-port="0" /> <edge from-layer="2662" from-port="0" to-layer="2663" to-port="1" /> <edge from-layer="2663" from-port="2" to-layer="2665" to-port="0" /> <edge from-layer="2664" from-port="0" to-layer="2665" to-port="1" /> <edge from-layer="2665" from-port="2" to-layer="2677" to-port="0" /> <edge from-layer="2665" from-port="2" to-layer="2666" to-port="0" /> <edge from-layer="2665" from-port="2" to-layer="2670" to-port="0" /> <edge from-layer="2666" from-port="2" to-layer="2680" to-port="0" /> <edge from-layer="2667" from-port="0" to-layer="2670" to-port="1" /> <edge from-layer="2668" from-port="0" to-layer="2670" to-port="2" /> <edge from-layer="2669" from-port="0" to-layer="2670" to-port="3" /> <edge from-layer="2670" from-port="5" to-layer="2673" to-port="0" /> <edge from-layer="2671" from-port="0" to-layer="2672" to-port="0" /> <edge from-layer="2672" from-port="1" to-layer="2673" to-port="1" /> <edge from-layer="2673" from-port="2" to-layer="2678" to-port="0" /> <edge from-layer="2674" from-port="0" to-layer="2677" to-port="1" /> <edge from-layer="2675" from-port="0" to-layer="2677" to-port="2" /> <edge from-layer="2676" from-port="0" to-layer="2677" to-port="3" /> <edge from-layer="2677" from-port="5" to-layer="2678" to-port="1" /> <edge from-layer="2678" from-port="2" to-layer="2679" to-port="0" /> <edge from-layer="2679" from-port="2" to-layer="2680" to-port="1" /> <edge from-layer="2680" from-port="2" to-layer="2734" to-port="0" /> <edge from-layer="2681" from-port="0" to-layer="2682" to-port="0" /> <edge from-layer="2682" from-port="1" to-layer="2687" to-port="0" /> <edge from-layer="2683" from-port="0" to-layer="2686" to-port="1" /> <edge from-layer="2684" from-port="0" to-layer="2686" to-port="2" /> <edge from-layer="2685" from-port="0" to-layer="2686" to-port="3" /> <edge from-layer="2686" from-port="4" to-layer="2687" to-port="1" /> <edge from-layer="2687" from-port="2" to-layer="2688" to-port="0" /> <edge from-layer="2688" from-port="1" to-layer="2690" to-port="0" /> <edge from-layer="2689" from-port="0" to-layer="2690" to-port="2" /> <edge from-layer="2690" from-port="3" to-layer="2714" to-port="0" /> <edge from-layer="2691" from-port="0" to-layer="2694" to-port="1" /> <edge from-layer="2692" from-port="0" to-layer="2694" to-port="2" /> <edge from-layer="2693" from-port="0" to-layer="2694" to-port="3" /> <edge from-layer="2694" from-port="5" to-layer="2696" to-port="0" /> <edge from-layer="2695" from-port="0" to-layer="2696" to-port="1" /> <edge from-layer="2696" from-port="2" to-layer="2698" to-port="0" /> <edge from-layer="2697" from-port="0" to-layer="2698" to-port="1" /> <edge from-layer="2698" from-port="2" to-layer="2699" to-port="0" /> <edge from-layer="2698" from-port="2" to-layer="2703" to-port="0" /> <edge from-layer="2698" from-port="2" to-layer="2710" to-port="0" /> <edge from-layer="2699" from-port="2" to-layer="2713" to-port="0" /> <edge from-layer="2700" from-port="0" to-layer="2703" to-port="1" /> <edge from-layer="2701" from-port="0" to-layer="2703" to-port="2" /> <edge from-layer="2702" from-port="0" to-layer="2703" to-port="3" /> <edge from-layer="2703" from-port="5" to-layer="2706" to-port="0" /> <edge from-layer="2704" from-port="0" to-layer="2705" to-port="0" /> <edge from-layer="2705" from-port="1" to-layer="2706" to-port="1" /> <edge from-layer="2706" from-port="2" to-layer="2711" to-port="0" /> <edge from-layer="2707" from-port="0" to-layer="2710" to-port="1" /> <edge from-layer="2708" from-port="0" to-layer="2710" to-port="2" /> <edge from-layer="2709" from-port="0" to-layer="2710" to-port="3" /> <edge from-layer="2710" from-port="5" to-layer="2711" to-port="1" /> <edge from-layer="2711" from-port="2" to-layer="2712" to-port="0" /> <edge from-layer="2712" from-port="2" to-layer="2713" to-port="1" /> <edge from-layer="2713" from-port="2" to-layer="2714" to-port="1" /> <edge from-layer="2714" from-port="2" to-layer="2734" to-port="1" /> <edge from-layer="2714" from-port="2" to-layer="4288" to-port="0" /> <edge from-layer="2715" from-port="0" to-layer="2716" to-port="0" /> <edge from-layer="2716" from-port="1" to-layer="2721" to-port="0" /> <edge from-layer="2717" from-port="0" to-layer="2720" to-port="1" /> <edge from-layer="2718" from-port="0" to-layer="2720" to-port="2" /> <edge from-layer="2719" from-port="0" to-layer="2720" to-port="3" /> <edge from-layer="2720" from-port="4" to-layer="2721" to-port="1" /> <edge from-layer="2721" from-port="2" to-layer="2722" to-port="0" /> <edge from-layer="2722" from-port="1" to-layer="2724" to-port="0" /> <edge from-layer="2723" from-port="0" to-layer="2724" to-port="2" /> <edge from-layer="2724" from-port="3" to-layer="2733" to-port="0" /> <edge from-layer="2725" from-port="0" to-layer="2728" to-port="1" /> <edge from-layer="2726" from-port="0" to-layer="2728" to-port="2" /> <edge from-layer="2727" from-port="0" to-layer="2728" to-port="3" /> <edge from-layer="2728" from-port="5" to-layer="2730" to-port="0" /> <edge from-layer="2729" from-port="0" to-layer="2730" to-port="1" /> <edge from-layer="2730" from-port="2" to-layer="2732" to-port="0" /> <edge from-layer="2731" from-port="0" to-layer="2732" to-port="1" /> <edge from-layer="2732" from-port="2" to-layer="2733" to-port="1" /> <edge from-layer="2733" from-port="2" to-layer="4287" to-port="0" /> <edge from-layer="2733" from-port="2" to-layer="2734" to-port="2" /> <edge from-layer="2734" from-port="4" to-layer="2736" to-port="0" /> <edge from-layer="2735" from-port="0" to-layer="2736" to-port="1" /> <edge from-layer="2736" from-port="2" to-layer="2738" to-port="0" /> <edge from-layer="2737" from-port="0" to-layer="2738" to-port="1" /> <edge from-layer="2738" from-port="2" to-layer="2741" to-port="0" /> <edge from-layer="2739" from-port="0" to-layer="2740" to-port="0" /> <edge from-layer="2740" from-port="1" to-layer="2741" to-port="1" /> <edge from-layer="2741" from-port="2" to-layer="2742" to-port="1" /> <edge from-layer="2742" from-port="2" to-layer="2749" to-port="0" /> <edge from-layer="2742" from-port="2" to-layer="2768" to-port="0" /> <edge from-layer="2742" from-port="2" to-layer="2757" to-port="0" /> <edge from-layer="2743" from-port="0" to-layer="2744" to-port="0" /> <edge from-layer="2744" from-port="1" to-layer="2758" to-port="0" /> <edge from-layer="2745" from-port="0" to-layer="2746" to-port="0" /> <edge from-layer="2746" from-port="1" to-layer="2756" to-port="0" /> <edge from-layer="2747" from-port="0" to-layer="2748" to-port="0" /> <edge from-layer="2748" from-port="1" to-layer="2749" to-port="1" /> <edge from-layer="2749" from-port="2" to-layer="2751" to-port="0" /> <edge from-layer="2750" from-port="0" to-layer="2751" to-port="1" /> <edge from-layer="2751" from-port="2" to-layer="2754" to-port="0" /> <edge from-layer="2752" from-port="0" to-layer="2753" to-port="0" /> <edge from-layer="2753" from-port="1" to-layer="2754" to-port="1" /> <edge from-layer="2754" from-port="2" to-layer="2755" to-port="0" /> <edge from-layer="2755" from-port="1" to-layer="2756" to-port="1" /> <edge from-layer="2756" from-port="2" to-layer="2757" to-port="1" /> <edge from-layer="2757" from-port="2" to-layer="2758" to-port="1" /> <edge from-layer="2758" from-port="2" to-layer="2761" to-port="0" /> <edge from-layer="2759" from-port="0" to-layer="2760" to-port="0" /> <edge from-layer="2760" from-port="1" to-layer="2761" to-port="1" /> <edge from-layer="2761" from-port="2" to-layer="2762" to-port="0" /> <edge from-layer="2762" from-port="3" to-layer="2763" to-port="0" /> <edge from-layer="2762" from-port="4" to-layer="2764" to-port="0" /> <edge from-layer="2763" from-port="1" to-layer="2764" to-port="1" /> <edge from-layer="2764" from-port="2" to-layer="2767" to-port="0" /> <edge from-layer="2765" from-port="0" to-layer="2766" to-port="0" /> <edge from-layer="2766" from-port="1" to-layer="2767" to-port="1" /> <edge from-layer="2767" from-port="2" to-layer="2768" to-port="1" /> <edge from-layer="2768" from-port="2" to-layer="2872" to-port="0" /> <edge from-layer="2768" from-port="2" to-layer="2783" to-port="0" /> <edge from-layer="2768" from-port="2" to-layer="2775" to-port="0" /> <edge from-layer="2769" from-port="0" to-layer="2770" to-port="0" /> <edge from-layer="2770" from-port="1" to-layer="2784" to-port="0" /> <edge from-layer="2771" from-port="0" to-layer="2772" to-port="0" /> <edge from-layer="2772" from-port="1" to-layer="2782" to-port="0" /> <edge from-layer="2773" from-port="0" to-layer="2774" to-port="0" /> <edge from-layer="2774" from-port="1" to-layer="2775" to-port="1" /> <edge from-layer="2775" from-port="2" to-layer="2777" to-port="0" /> <edge from-layer="2776" from-port="0" to-layer="2777" to-port="1" /> <edge from-layer="2777" from-port="2" to-layer="2780" to-port="0" /> <edge from-layer="2778" from-port="0" to-layer="2779" to-port="0" /> <edge from-layer="2779" from-port="1" to-layer="2780" to-port="1" /> <edge from-layer="2780" from-port="2" to-layer="2781" to-port="0" /> <edge from-layer="2781" from-port="1" to-layer="2782" to-port="1" /> <edge from-layer="2782" from-port="2" to-layer="2783" to-port="1" /> <edge from-layer="2783" from-port="2" to-layer="2784" to-port="1" /> <edge from-layer="2784" from-port="2" to-layer="2787" to-port="0" /> <edge from-layer="2785" from-port="0" to-layer="2786" to-port="0" /> <edge from-layer="2786" from-port="1" to-layer="2787" to-port="1" /> <edge from-layer="2787" from-port="2" to-layer="2824" to-port="0" /> <edge from-layer="2787" from-port="2" to-layer="2791" to-port="0" /> <edge from-layer="2787" from-port="2" to-layer="2858" to-port="0" /> <edge from-layer="2788" from-port="0" to-layer="2791" to-port="1" /> <edge from-layer="2789" from-port="0" to-layer="2791" to-port="2" /> <edge from-layer="2790" from-port="0" to-layer="2791" to-port="3" /> <edge from-layer="2791" from-port="5" to-layer="2793" to-port="0" /> <edge from-layer="2792" from-port="0" to-layer="2793" to-port="1" /> <edge from-layer="2793" from-port="2" to-layer="2795" to-port="0" /> <edge from-layer="2794" from-port="0" to-layer="2795" to-port="1" /> <edge from-layer="2795" from-port="2" to-layer="2807" to-port="0" /> <edge from-layer="2795" from-port="2" to-layer="2796" to-port="0" /> <edge from-layer="2795" from-port="2" to-layer="2800" to-port="0" /> <edge from-layer="2796" from-port="2" to-layer="2810" to-port="0" /> <edge from-layer="2797" from-port="0" to-layer="2800" to-port="1" /> <edge from-layer="2798" from-port="0" to-layer="2800" to-port="2" /> <edge from-layer="2799" from-port="0" to-layer="2800" to-port="3" /> <edge from-layer="2800" from-port="5" to-layer="2803" to-port="0" /> <edge from-layer="2801" from-port="0" to-layer="2802" to-port="0" /> <edge from-layer="2802" from-port="1" to-layer="2803" to-port="1" /> <edge from-layer="2803" from-port="2" to-layer="2808" to-port="0" /> <edge from-layer="2804" from-port="0" to-layer="2807" to-port="1" /> <edge from-layer="2805" from-port="0" to-layer="2807" to-port="2" /> <edge from-layer="2806" from-port="0" to-layer="2807" to-port="3" /> <edge from-layer="2807" from-port="5" to-layer="2808" to-port="1" /> <edge from-layer="2808" from-port="2" to-layer="2809" to-port="0" /> <edge from-layer="2809" from-port="2" to-layer="2810" to-port="1" /> <edge from-layer="2810" from-port="2" to-layer="2864" to-port="0" /> <edge from-layer="2811" from-port="0" to-layer="2812" to-port="0" /> <edge from-layer="2812" from-port="1" to-layer="2817" to-port="0" /> <edge from-layer="2813" from-port="0" to-layer="2816" to-port="1" /> <edge from-layer="2814" from-port="0" to-layer="2816" to-port="2" /> <edge from-layer="2815" from-port="0" to-layer="2816" to-port="3" /> <edge from-layer="2816" from-port="4" to-layer="2817" to-port="1" /> <edge from-layer="2817" from-port="2" to-layer="2818" to-port="0" /> <edge from-layer="2818" from-port="1" to-layer="2820" to-port="0" /> <edge from-layer="2819" from-port="0" to-layer="2820" to-port="2" /> <edge from-layer="2820" from-port="3" to-layer="2844" to-port="0" /> <edge from-layer="2821" from-port="0" to-layer="2824" to-port="1" /> <edge from-layer="2822" from-port="0" to-layer="2824" to-port="2" /> <edge from-layer="2823" from-port="0" to-layer="2824" to-port="3" /> <edge from-layer="2824" from-port="5" to-layer="2826" to-port="0" /> <edge from-layer="2825" from-port="0" to-layer="2826" to-port="1" /> <edge from-layer="2826" from-port="2" to-layer="2828" to-port="0" /> <edge from-layer="2827" from-port="0" to-layer="2828" to-port="1" /> <edge from-layer="2828" from-port="2" to-layer="2833" to-port="0" /> <edge from-layer="2828" from-port="2" to-layer="2829" to-port="0" /> <edge from-layer="2828" from-port="2" to-layer="2840" to-port="0" /> <edge from-layer="2829" from-port="2" to-layer="2843" to-port="0" /> <edge from-layer="2830" from-port="0" to-layer="2833" to-port="1" /> <edge from-layer="2831" from-port="0" to-layer="2833" to-port="2" /> <edge from-layer="2832" from-port="0" to-layer="2833" to-port="3" /> <edge from-layer="2833" from-port="5" to-layer="2836" to-port="0" /> <edge from-layer="2834" from-port="0" to-layer="2835" to-port="0" /> <edge from-layer="2835" from-port="1" to-layer="2836" to-port="1" /> <edge from-layer="2836" from-port="2" to-layer="2841" to-port="0" /> <edge from-layer="2837" from-port="0" to-layer="2840" to-port="1" /> <edge from-layer="2838" from-port="0" to-layer="2840" to-port="2" /> <edge from-layer="2839" from-port="0" to-layer="2840" to-port="3" /> <edge from-layer="2840" from-port="5" to-layer="2841" to-port="1" /> <edge from-layer="2841" from-port="2" to-layer="2842" to-port="0" /> <edge from-layer="2842" from-port="2" to-layer="2843" to-port="1" /> <edge from-layer="2843" from-port="2" to-layer="2844" to-port="1" /> <edge from-layer="2844" from-port="2" to-layer="2864" to-port="1" /> <edge from-layer="2844" from-port="2" to-layer="4284" to-port="0" /> <edge from-layer="2845" from-port="0" to-layer="2846" to-port="0" /> <edge from-layer="2846" from-port="1" to-layer="2851" to-port="0" /> <edge from-layer="2847" from-port="0" to-layer="2850" to-port="1" /> <edge from-layer="2848" from-port="0" to-layer="2850" to-port="2" /> <edge from-layer="2849" from-port="0" to-layer="2850" to-port="3" /> <edge from-layer="2850" from-port="4" to-layer="2851" to-port="1" /> <edge from-layer="2851" from-port="2" to-layer="2852" to-port="0" /> <edge from-layer="2852" from-port="1" to-layer="2854" to-port="0" /> <edge from-layer="2853" from-port="0" to-layer="2854" to-port="2" /> <edge from-layer="2854" from-port="3" to-layer="2863" to-port="0" /> <edge from-layer="2855" from-port="0" to-layer="2858" to-port="1" /> <edge from-layer="2856" from-port="0" to-layer="2858" to-port="2" /> <edge from-layer="2857" from-port="0" to-layer="2858" to-port="3" /> <edge from-layer="2858" from-port="5" to-layer="2860" to-port="0" /> <edge from-layer="2859" from-port="0" to-layer="2860" to-port="1" /> <edge from-layer="2860" from-port="2" to-layer="2862" to-port="0" /> <edge from-layer="2861" from-port="0" to-layer="2862" to-port="1" /> <edge from-layer="2862" from-port="2" to-layer="2863" to-port="1" /> <edge from-layer="2863" from-port="2" to-layer="4283" to-port="0" /> <edge from-layer="2863" from-port="2" to-layer="2864" to-port="2" /> <edge from-layer="2864" from-port="4" to-layer="2866" to-port="0" /> <edge from-layer="2865" from-port="0" to-layer="2866" to-port="1" /> <edge from-layer="2866" from-port="2" to-layer="2868" to-port="0" /> <edge from-layer="2867" from-port="0" to-layer="2868" to-port="1" /> <edge from-layer="2868" from-port="2" to-layer="2871" to-port="0" /> <edge from-layer="2869" from-port="0" to-layer="2870" to-port="0" /> <edge from-layer="2870" from-port="1" to-layer="2871" to-port="1" /> <edge from-layer="2871" from-port="2" to-layer="2872" to-port="1" /> <edge from-layer="2872" from-port="2" to-layer="2898" to-port="0" /> <edge from-layer="2872" from-port="2" to-layer="2887" to-port="0" /> <edge from-layer="2872" from-port="2" to-layer="2879" to-port="0" /> <edge from-layer="2873" from-port="0" to-layer="2874" to-port="0" /> <edge from-layer="2874" from-port="1" to-layer="2888" to-port="0" /> <edge from-layer="2875" from-port="0" to-layer="2876" to-port="0" /> <edge from-layer="2876" from-port="1" to-layer="2886" to-port="0" /> <edge from-layer="2877" from-port="0" to-layer="2878" to-port="0" /> <edge from-layer="2878" from-port="1" to-layer="2879" to-port="1" /> <edge from-layer="2879" from-port="2" to-layer="2881" to-port="0" /> <edge from-layer="2880" from-port="0" to-layer="2881" to-port="1" /> <edge from-layer="2881" from-port="2" to-layer="2884" to-port="0" /> <edge from-layer="2882" from-port="0" to-layer="2883" to-port="0" /> <edge from-layer="2883" from-port="1" to-layer="2884" to-port="1" /> <edge from-layer="2884" from-port="2" to-layer="2885" to-port="0" /> <edge from-layer="2885" from-port="1" to-layer="2886" to-port="1" /> <edge from-layer="2886" from-port="2" to-layer="2887" to-port="1" /> <edge from-layer="2887" from-port="2" to-layer="2888" to-port="1" /> <edge from-layer="2888" from-port="2" to-layer="2891" to-port="0" /> <edge from-layer="2889" from-port="0" to-layer="2890" to-port="0" /> <edge from-layer="2890" from-port="1" to-layer="2891" to-port="1" /> <edge from-layer="2891" from-port="2" to-layer="2892" to-port="0" /> <edge from-layer="2892" from-port="3" to-layer="2893" to-port="0" /> <edge from-layer="2892" from-port="4" to-layer="2894" to-port="0" /> <edge from-layer="2893" from-port="1" to-layer="2894" to-port="1" /> <edge from-layer="2894" from-port="2" to-layer="2897" to-port="0" /> <edge from-layer="2895" from-port="0" to-layer="2896" to-port="0" /> <edge from-layer="2896" from-port="1" to-layer="2897" to-port="1" /> <edge from-layer="2897" from-port="2" to-layer="2898" to-port="1" /> <edge from-layer="2898" from-port="2" to-layer="2913" to-port="0" /> <edge from-layer="2898" from-port="2" to-layer="3002" to-port="0" /> <edge from-layer="2898" from-port="2" to-layer="2905" to-port="0" /> <edge from-layer="2899" from-port="0" to-layer="2900" to-port="0" /> <edge from-layer="2900" from-port="1" to-layer="2914" to-port="0" /> <edge from-layer="2901" from-port="0" to-layer="2902" to-port="0" /> <edge from-layer="2902" from-port="1" to-layer="2912" to-port="0" /> <edge from-layer="2903" from-port="0" to-layer="2904" to-port="0" /> <edge from-layer="2904" from-port="1" to-layer="2905" to-port="1" /> <edge from-layer="2905" from-port="2" to-layer="2907" to-port="0" /> <edge from-layer="2906" from-port="0" to-layer="2907" to-port="1" /> <edge from-layer="2907" from-port="2" to-layer="2910" to-port="0" /> <edge from-layer="2908" from-port="0" to-layer="2909" to-port="0" /> <edge from-layer="2909" from-port="1" to-layer="2910" to-port="1" /> <edge from-layer="2910" from-port="2" to-layer="2911" to-port="0" /> <edge from-layer="2911" from-port="1" to-layer="2912" to-port="1" /> <edge from-layer="2912" from-port="2" to-layer="2913" to-port="1" /> <edge from-layer="2913" from-port="2" to-layer="2914" to-port="1" /> <edge from-layer="2914" from-port="2" to-layer="2917" to-port="0" /> <edge from-layer="2915" from-port="0" to-layer="2916" to-port="0" /> <edge from-layer="2916" from-port="1" to-layer="2917" to-port="1" /> <edge from-layer="2917" from-port="2" to-layer="2988" to-port="0" /> <edge from-layer="2917" from-port="2" to-layer="2954" to-port="0" /> <edge from-layer="2917" from-port="2" to-layer="2921" to-port="0" /> <edge from-layer="2918" from-port="0" to-layer="2921" to-port="1" /> <edge from-layer="2919" from-port="0" to-layer="2921" to-port="2" /> <edge from-layer="2920" from-port="0" to-layer="2921" to-port="3" /> <edge from-layer="2921" from-port="5" to-layer="2923" to-port="0" /> <edge from-layer="2922" from-port="0" to-layer="2923" to-port="1" /> <edge from-layer="2923" from-port="2" to-layer="2925" to-port="0" /> <edge from-layer="2924" from-port="0" to-layer="2925" to-port="1" /> <edge from-layer="2925" from-port="2" to-layer="2937" to-port="0" /> <edge from-layer="2925" from-port="2" to-layer="2930" to-port="0" /> <edge from-layer="2925" from-port="2" to-layer="2926" to-port="0" /> <edge from-layer="2926" from-port="2" to-layer="2940" to-port="0" /> <edge from-layer="2927" from-port="0" to-layer="2930" to-port="1" /> <edge from-layer="2928" from-port="0" to-layer="2930" to-port="2" /> <edge from-layer="2929" from-port="0" to-layer="2930" to-port="3" /> <edge from-layer="2930" from-port="5" to-layer="2933" to-port="0" /> <edge from-layer="2931" from-port="0" to-layer="2932" to-port="0" /> <edge from-layer="2932" from-port="1" to-layer="2933" to-port="1" /> <edge from-layer="2933" from-port="2" to-layer="2938" to-port="0" /> <edge from-layer="2934" from-port="0" to-layer="2937" to-port="1" /> <edge from-layer="2935" from-port="0" to-layer="2937" to-port="2" /> <edge from-layer="2936" from-port="0" to-layer="2937" to-port="3" /> <edge from-layer="2937" from-port="5" to-layer="2938" to-port="1" /> <edge from-layer="2938" from-port="2" to-layer="2939" to-port="0" /> <edge from-layer="2939" from-port="2" to-layer="2940" to-port="1" /> <edge from-layer="2940" from-port="2" to-layer="2994" to-port="0" /> <edge from-layer="2941" from-port="0" to-layer="2942" to-port="0" /> <edge from-layer="2942" from-port="1" to-layer="2947" to-port="0" /> <edge from-layer="2943" from-port="0" to-layer="2946" to-port="1" /> <edge from-layer="2944" from-port="0" to-layer="2946" to-port="2" /> <edge from-layer="2945" from-port="0" to-layer="2946" to-port="3" /> <edge from-layer="2946" from-port="4" to-layer="2947" to-port="1" /> <edge from-layer="2947" from-port="2" to-layer="2948" to-port="0" /> <edge from-layer="2948" from-port="1" to-layer="2950" to-port="0" /> <edge from-layer="2949" from-port="0" to-layer="2950" to-port="2" /> <edge from-layer="2950" from-port="3" to-layer="2974" to-port="0" /> <edge from-layer="2951" from-port="0" to-layer="2954" to-port="1" /> <edge from-layer="2952" from-port="0" to-layer="2954" to-port="2" /> <edge from-layer="2953" from-port="0" to-layer="2954" to-port="3" /> <edge from-layer="2954" from-port="5" to-layer="2956" to-port="0" /> <edge from-layer="2955" from-port="0" to-layer="2956" to-port="1" /> <edge from-layer="2956" from-port="2" to-layer="2958" to-port="0" /> <edge from-layer="2957" from-port="0" to-layer="2958" to-port="1" /> <edge from-layer="2958" from-port="2" to-layer="2970" to-port="0" /> <edge from-layer="2958" from-port="2" to-layer="2959" to-port="0" /> <edge from-layer="2958" from-port="2" to-layer="2963" to-port="0" /> <edge from-layer="2959" from-port="2" to-layer="2973" to-port="0" /> <edge from-layer="2960" from-port="0" to-layer="2963" to-port="1" /> <edge from-layer="2961" from-port="0" to-layer="2963" to-port="2" /> <edge from-layer="2962" from-port="0" to-layer="2963" to-port="3" /> <edge from-layer="2963" from-port="5" to-layer="2966" to-port="0" /> <edge from-layer="2964" from-port="0" to-layer="2965" to-port="0" /> <edge from-layer="2965" from-port="1" to-layer="2966" to-port="1" /> <edge from-layer="2966" from-port="2" to-layer="2971" to-port="0" /> <edge from-layer="2967" from-port="0" to-layer="2970" to-port="1" /> <edge from-layer="2968" from-port="0" to-layer="2970" to-port="2" /> <edge from-layer="2969" from-port="0" to-layer="2970" to-port="3" /> <edge from-layer="2970" from-port="5" to-layer="2971" to-port="1" /> <edge from-layer="2971" from-port="2" to-layer="2972" to-port="0" /> <edge from-layer="2972" from-port="2" to-layer="2973" to-port="1" /> <edge from-layer="2973" from-port="2" to-layer="2974" to-port="1" /> <edge from-layer="2974" from-port="2" to-layer="2994" to-port="1" /> <edge from-layer="2974" from-port="2" to-layer="4282" to-port="0" /> <edge from-layer="2975" from-port="0" to-layer="2976" to-port="0" /> <edge from-layer="2976" from-port="1" to-layer="2981" to-port="0" /> <edge from-layer="2977" from-port="0" to-layer="2980" to-port="1" /> <edge from-layer="2978" from-port="0" to-layer="2980" to-port="2" /> <edge from-layer="2979" from-port="0" to-layer="2980" to-port="3" /> <edge from-layer="2980" from-port="4" to-layer="2981" to-port="1" /> <edge from-layer="2981" from-port="2" to-layer="2982" to-port="0" /> <edge from-layer="2982" from-port="1" to-layer="2984" to-port="0" /> <edge from-layer="2983" from-port="0" to-layer="2984" to-port="2" /> <edge from-layer="2984" from-port="3" to-layer="2993" to-port="0" /> <edge from-layer="2985" from-port="0" to-layer="2988" to-port="1" /> <edge from-layer="2986" from-port="0" to-layer="2988" to-port="2" /> <edge from-layer="2987" from-port="0" to-layer="2988" to-port="3" /> <edge from-layer="2988" from-port="5" to-layer="2990" to-port="0" /> <edge from-layer="2989" from-port="0" to-layer="2990" to-port="1" /> <edge from-layer="2990" from-port="2" to-layer="2992" to-port="0" /> <edge from-layer="2991" from-port="0" to-layer="2992" to-port="1" /> <edge from-layer="2992" from-port="2" to-layer="2993" to-port="1" /> <edge from-layer="2993" from-port="2" to-layer="4281" to-port="0" /> <edge from-layer="2993" from-port="2" to-layer="2994" to-port="2" /> <edge from-layer="2994" from-port="4" to-layer="2996" to-port="0" /> <edge from-layer="2995" from-port="0" to-layer="2996" to-port="1" /> <edge from-layer="2996" from-port="2" to-layer="2998" to-port="0" /> <edge from-layer="2997" from-port="0" to-layer="2998" to-port="1" /> <edge from-layer="2998" from-port="2" to-layer="3001" to-port="0" /> <edge from-layer="2999" from-port="0" to-layer="3000" to-port="0" /> <edge from-layer="3000" from-port="1" to-layer="3001" to-port="1" /> <edge from-layer="3001" from-port="2" to-layer="3002" to-port="1" /> <edge from-layer="3002" from-port="2" to-layer="3017" to-port="0" /> <edge from-layer="3002" from-port="2" to-layer="3028" to-port="0" /> <edge from-layer="3002" from-port="2" to-layer="3009" to-port="0" /> <edge from-layer="3003" from-port="0" to-layer="3004" to-port="0" /> <edge from-layer="3004" from-port="1" to-layer="3018" to-port="0" /> <edge from-layer="3005" from-port="0" to-layer="3006" to-port="0" /> <edge from-layer="3006" from-port="1" to-layer="3016" to-port="0" /> <edge from-layer="3007" from-port="0" to-layer="3008" to-port="0" /> <edge from-layer="3008" from-port="1" to-layer="3009" to-port="1" /> <edge from-layer="3009" from-port="2" to-layer="3011" to-port="0" /> <edge from-layer="3010" from-port="0" to-layer="3011" to-port="1" /> <edge from-layer="3011" from-port="2" to-layer="3014" to-port="0" /> <edge from-layer="3012" from-port="0" to-layer="3013" to-port="0" /> <edge from-layer="3013" from-port="1" to-layer="3014" to-port="1" /> <edge from-layer="3014" from-port="2" to-layer="3015" to-port="0" /> <edge from-layer="3015" from-port="1" to-layer="3016" to-port="1" /> <edge from-layer="3016" from-port="2" to-layer="3017" to-port="1" /> <edge from-layer="3017" from-port="2" to-layer="3018" to-port="1" /> <edge from-layer="3018" from-port="2" to-layer="3021" to-port="0" /> <edge from-layer="3019" from-port="0" to-layer="3020" to-port="0" /> <edge from-layer="3020" from-port="1" to-layer="3021" to-port="1" /> <edge from-layer="3021" from-port="2" to-layer="3022" to-port="0" /> <edge from-layer="3022" from-port="3" to-layer="3023" to-port="0" /> <edge from-layer="3022" from-port="4" to-layer="3024" to-port="0" /> <edge from-layer="3023" from-port="1" to-layer="3024" to-port="1" /> <edge from-layer="3024" from-port="2" to-layer="3027" to-port="0" /> <edge from-layer="3025" from-port="0" to-layer="3026" to-port="0" /> <edge from-layer="3026" from-port="1" to-layer="3027" to-port="1" /> <edge from-layer="3027" from-port="2" to-layer="3028" to-port="1" /> <edge from-layer="3028" from-port="2" to-layer="3035" to-port="0" /> <edge from-layer="3028" from-port="2" to-layer="3132" to-port="0" /> <edge from-layer="3028" from-port="2" to-layer="3043" to-port="0" /> <edge from-layer="3029" from-port="0" to-layer="3030" to-port="0" /> <edge from-layer="3030" from-port="1" to-layer="3044" to-port="0" /> <edge from-layer="3031" from-port="0" to-layer="3032" to-port="0" /> <edge from-layer="3032" from-port="1" to-layer="3042" to-port="0" /> <edge from-layer="3033" from-port="0" to-layer="3034" to-port="0" /> <edge from-layer="3034" from-port="1" to-layer="3035" to-port="1" /> <edge from-layer="3035" from-port="2" to-layer="3037" to-port="0" /> <edge from-layer="3036" from-port="0" to-layer="3037" to-port="1" /> <edge from-layer="3037" from-port="2" to-layer="3040" to-port="0" /> <edge from-layer="3038" from-port="0" to-layer="3039" to-port="0" /> <edge from-layer="3039" from-port="1" to-layer="3040" to-port="1" /> <edge from-layer="3040" from-port="2" to-layer="3041" to-port="0" /> <edge from-layer="3041" from-port="1" to-layer="3042" to-port="1" /> <edge from-layer="3042" from-port="2" to-layer="3043" to-port="1" /> <edge from-layer="3043" from-port="2" to-layer="3044" to-port="1" /> <edge from-layer="3044" from-port="2" to-layer="3047" to-port="0" /> <edge from-layer="3045" from-port="0" to-layer="3046" to-port="0" /> <edge from-layer="3046" from-port="1" to-layer="3047" to-port="1" /> <edge from-layer="3047" from-port="2" to-layer="3084" to-port="0" /> <edge from-layer="3047" from-port="2" to-layer="3051" to-port="0" /> <edge from-layer="3047" from-port="2" to-layer="3118" to-port="0" /> <edge from-layer="3048" from-port="0" to-layer="3051" to-port="1" /> <edge from-layer="3049" from-port="0" to-layer="3051" to-port="2" /> <edge from-layer="3050" from-port="0" to-layer="3051" to-port="3" /> <edge from-layer="3051" from-port="5" to-layer="3053" to-port="0" /> <edge from-layer="3052" from-port="0" to-layer="3053" to-port="1" /> <edge from-layer="3053" from-port="2" to-layer="3055" to-port="0" /> <edge from-layer="3054" from-port="0" to-layer="3055" to-port="1" /> <edge from-layer="3055" from-port="2" to-layer="3060" to-port="0" /> <edge from-layer="3055" from-port="2" to-layer="3056" to-port="0" /> <edge from-layer="3055" from-port="2" to-layer="3067" to-port="0" /> <edge from-layer="3056" from-port="2" to-layer="3070" to-port="0" /> <edge from-layer="3057" from-port="0" to-layer="3060" to-port="1" /> <edge from-layer="3058" from-port="0" to-layer="3060" to-port="2" /> <edge from-layer="3059" from-port="0" to-layer="3060" to-port="3" /> <edge from-layer="3060" from-port="5" to-layer="3063" to-port="0" /> <edge from-layer="3061" from-port="0" to-layer="3062" to-port="0" /> <edge from-layer="3062" from-port="1" to-layer="3063" to-port="1" /> <edge from-layer="3063" from-port="2" to-layer="3068" to-port="0" /> <edge from-layer="3064" from-port="0" to-layer="3067" to-port="1" /> <edge from-layer="3065" from-port="0" to-layer="3067" to-port="2" /> <edge from-layer="3066" from-port="0" to-layer="3067" to-port="3" /> <edge from-layer="3067" from-port="5" to-layer="3068" to-port="1" /> <edge from-layer="3068" from-port="2" to-layer="3069" to-port="0" /> <edge from-layer="3069" from-port="2" to-layer="3070" to-port="1" /> <edge from-layer="3070" from-port="2" to-layer="3124" to-port="0" /> <edge from-layer="3071" from-port="0" to-layer="3072" to-port="0" /> <edge from-layer="3072" from-port="1" to-layer="3077" to-port="0" /> <edge from-layer="3073" from-port="0" to-layer="3076" to-port="1" /> <edge from-layer="3074" from-port="0" to-layer="3076" to-port="2" /> <edge from-layer="3075" from-port="0" to-layer="3076" to-port="3" /> <edge from-layer="3076" from-port="4" to-layer="3077" to-port="1" /> <edge from-layer="3077" from-port="2" to-layer="3078" to-port="0" /> <edge from-layer="3078" from-port="1" to-layer="3080" to-port="0" /> <edge from-layer="3079" from-port="0" to-layer="3080" to-port="2" /> <edge from-layer="3080" from-port="3" to-layer="3104" to-port="0" /> <edge from-layer="3081" from-port="0" to-layer="3084" to-port="1" /> <edge from-layer="3082" from-port="0" to-layer="3084" to-port="2" /> <edge from-layer="3083" from-port="0" to-layer="3084" to-port="3" /> <edge from-layer="3084" from-port="5" to-layer="3086" to-port="0" /> <edge from-layer="3085" from-port="0" to-layer="3086" to-port="1" /> <edge from-layer="3086" from-port="2" to-layer="3088" to-port="0" /> <edge from-layer="3087" from-port="0" to-layer="3088" to-port="1" /> <edge from-layer="3088" from-port="2" to-layer="3093" to-port="0" /> <edge from-layer="3088" from-port="2" to-layer="3089" to-port="0" /> <edge from-layer="3088" from-port="2" to-layer="3100" to-port="0" /> <edge from-layer="3089" from-port="2" to-layer="3103" to-port="0" /> <edge from-layer="3090" from-port="0" to-layer="3093" to-port="1" /> <edge from-layer="3091" from-port="0" to-layer="3093" to-port="2" /> <edge from-layer="3092" from-port="0" to-layer="3093" to-port="3" /> <edge from-layer="3093" from-port="5" to-layer="3096" to-port="0" /> <edge from-layer="3094" from-port="0" to-layer="3095" to-port="0" /> <edge from-layer="3095" from-port="1" to-layer="3096" to-port="1" /> <edge from-layer="3096" from-port="2" to-layer="3101" to-port="0" /> <edge from-layer="3097" from-port="0" to-layer="3100" to-port="1" /> <edge from-layer="3098" from-port="0" to-layer="3100" to-port="2" /> <edge from-layer="3099" from-port="0" to-layer="3100" to-port="3" /> <edge from-layer="3100" from-port="5" to-layer="3101" to-port="1" /> <edge from-layer="3101" from-port="2" to-layer="3102" to-port="0" /> <edge from-layer="3102" from-port="2" to-layer="3103" to-port="1" /> <edge from-layer="3103" from-port="2" to-layer="3104" to-port="1" /> <edge from-layer="3104" from-port="2" to-layer="4280" to-port="0" /> <edge from-layer="3104" from-port="2" to-layer="3124" to-port="1" /> <edge from-layer="3105" from-port="0" to-layer="3106" to-port="0" /> <edge from-layer="3106" from-port="1" to-layer="3111" to-port="0" /> <edge from-layer="3107" from-port="0" to-layer="3110" to-port="1" /> <edge from-layer="3108" from-port="0" to-layer="3110" to-port="2" /> <edge from-layer="3109" from-port="0" to-layer="3110" to-port="3" /> <edge from-layer="3110" from-port="4" to-layer="3111" to-port="1" /> <edge from-layer="3111" from-port="2" to-layer="3112" to-port="0" /> <edge from-layer="3112" from-port="1" to-layer="3114" to-port="0" /> <edge from-layer="3113" from-port="0" to-layer="3114" to-port="2" /> <edge from-layer="3114" from-port="3" to-layer="3123" to-port="0" /> <edge from-layer="3115" from-port="0" to-layer="3118" to-port="1" /> <edge from-layer="3116" from-port="0" to-layer="3118" to-port="2" /> <edge from-layer="3117" from-port="0" to-layer="3118" to-port="3" /> <edge from-layer="3118" from-port="5" to-layer="3120" to-port="0" /> <edge from-layer="3119" from-port="0" to-layer="3120" to-port="1" /> <edge from-layer="3120" from-port="2" to-layer="3122" to-port="0" /> <edge from-layer="3121" from-port="0" to-layer="3122" to-port="1" /> <edge from-layer="3122" from-port="2" to-layer="3123" to-port="1" /> <edge from-layer="3123" from-port="2" to-layer="3124" to-port="2" /> <edge from-layer="3123" from-port="2" to-layer="4279" to-port="0" /> <edge from-layer="3124" from-port="4" to-layer="3126" to-port="0" /> <edge from-layer="3125" from-port="0" to-layer="3126" to-port="1" /> <edge from-layer="3126" from-port="2" to-layer="3128" to-port="0" /> <edge from-layer="3127" from-port="0" to-layer="3128" to-port="1" /> <edge from-layer="3128" from-port="2" to-layer="3131" to-port="0" /> <edge from-layer="3129" from-port="0" to-layer="3130" to-port="0" /> <edge from-layer="3130" from-port="1" to-layer="3131" to-port="1" /> <edge from-layer="3131" from-port="2" to-layer="3132" to-port="1" /> <edge from-layer="3132" from-port="2" to-layer="3158" to-port="0" /> <edge from-layer="3132" from-port="2" to-layer="3139" to-port="0" /> <edge from-layer="3132" from-port="2" to-layer="3147" to-port="0" /> <edge from-layer="3133" from-port="0" to-layer="3134" to-port="0" /> <edge from-layer="3134" from-port="1" to-layer="3148" to-port="0" /> <edge from-layer="3135" from-port="0" to-layer="3136" to-port="0" /> <edge from-layer="3136" from-port="1" to-layer="3146" to-port="0" /> <edge from-layer="3137" from-port="0" to-layer="3138" to-port="0" /> <edge from-layer="3138" from-port="1" to-layer="3139" to-port="1" /> <edge from-layer="3139" from-port="2" to-layer="3141" to-port="0" /> <edge from-layer="3140" from-port="0" to-layer="3141" to-port="1" /> <edge from-layer="3141" from-port="2" to-layer="3144" to-port="0" /> <edge from-layer="3142" from-port="0" to-layer="3143" to-port="0" /> <edge from-layer="3143" from-port="1" to-layer="3144" to-port="1" /> <edge from-layer="3144" from-port="2" to-layer="3145" to-port="0" /> <edge from-layer="3145" from-port="1" to-layer="3146" to-port="1" /> <edge from-layer="3146" from-port="2" to-layer="3147" to-port="1" /> <edge from-layer="3147" from-port="2" to-layer="3148" to-port="1" /> <edge from-layer="3148" from-port="2" to-layer="3151" to-port="0" /> <edge from-layer="3149" from-port="0" to-layer="3150" to-port="0" /> <edge from-layer="3150" from-port="1" to-layer="3151" to-port="1" /> <edge from-layer="3151" from-port="2" to-layer="3152" to-port="0" /> <edge from-layer="3152" from-port="3" to-layer="3153" to-port="0" /> <edge from-layer="3152" from-port="4" to-layer="3154" to-port="0" /> <edge from-layer="3153" from-port="1" to-layer="3154" to-port="1" /> <edge from-layer="3154" from-port="2" to-layer="3157" to-port="0" /> <edge from-layer="3155" from-port="0" to-layer="3156" to-port="0" /> <edge from-layer="3156" from-port="1" to-layer="3157" to-port="1" /> <edge from-layer="3157" from-port="2" to-layer="3158" to-port="1" /> <edge from-layer="3158" from-port="2" to-layer="3262" to-port="0" /> <edge from-layer="3158" from-port="2" to-layer="3173" to-port="0" /> <edge from-layer="3158" from-port="2" to-layer="3165" to-port="0" /> <edge from-layer="3159" from-port="0" to-layer="3160" to-port="0" /> <edge from-layer="3160" from-port="1" to-layer="3174" to-port="0" /> <edge from-layer="3161" from-port="0" to-layer="3162" to-port="0" /> <edge from-layer="3162" from-port="1" to-layer="3172" to-port="0" /> <edge from-layer="3163" from-port="0" to-layer="3164" to-port="0" /> <edge from-layer="3164" from-port="1" to-layer="3165" to-port="1" /> <edge from-layer="3165" from-port="2" to-layer="3167" to-port="0" /> <edge from-layer="3166" from-port="0" to-layer="3167" to-port="1" /> <edge from-layer="3167" from-port="2" to-layer="3170" to-port="0" /> <edge from-layer="3168" from-port="0" to-layer="3169" to-port="0" /> <edge from-layer="3169" from-port="1" to-layer="3170" to-port="1" /> <edge from-layer="3170" from-port="2" to-layer="3171" to-port="0" /> <edge from-layer="3171" from-port="1" to-layer="3172" to-port="1" /> <edge from-layer="3172" from-port="2" to-layer="3173" to-port="1" /> <edge from-layer="3173" from-port="2" to-layer="3174" to-port="1" /> <edge from-layer="3174" from-port="2" to-layer="3177" to-port="0" /> <edge from-layer="3175" from-port="0" to-layer="3176" to-port="0" /> <edge from-layer="3176" from-port="1" to-layer="3177" to-port="1" /> <edge from-layer="3177" from-port="2" to-layer="3248" to-port="0" /> <edge from-layer="3177" from-port="2" to-layer="3181" to-port="0" /> <edge from-layer="3177" from-port="2" to-layer="3214" to-port="0" /> <edge from-layer="3178" from-port="0" to-layer="3181" to-port="1" /> <edge from-layer="3179" from-port="0" to-layer="3181" to-port="2" /> <edge from-layer="3180" from-port="0" to-layer="3181" to-port="3" /> <edge from-layer="3181" from-port="5" to-layer="3183" to-port="0" /> <edge from-layer="3182" from-port="0" to-layer="3183" to-port="1" /> <edge from-layer="3183" from-port="2" to-layer="3185" to-port="0" /> <edge from-layer="3184" from-port="0" to-layer="3185" to-port="1" /> <edge from-layer="3185" from-port="2" to-layer="3197" to-port="0" /> <edge from-layer="3185" from-port="2" to-layer="3186" to-port="0" /> <edge from-layer="3185" from-port="2" to-layer="3190" to-port="0" /> <edge from-layer="3186" from-port="2" to-layer="3200" to-port="0" /> <edge from-layer="3187" from-port="0" to-layer="3190" to-port="1" /> <edge from-layer="3188" from-port="0" to-layer="3190" to-port="2" /> <edge from-layer="3189" from-port="0" to-layer="3190" to-port="3" /> <edge from-layer="3190" from-port="5" to-layer="3193" to-port="0" /> <edge from-layer="3191" from-port="0" to-layer="3192" to-port="0" /> <edge from-layer="3192" from-port="1" to-layer="3193" to-port="1" /> <edge from-layer="3193" from-port="2" to-layer="3198" to-port="0" /> <edge from-layer="3194" from-port="0" to-layer="3197" to-port="1" /> <edge from-layer="3195" from-port="0" to-layer="3197" to-port="2" /> <edge from-layer="3196" from-port="0" to-layer="3197" to-port="3" /> <edge from-layer="3197" from-port="5" to-layer="3198" to-port="1" /> <edge from-layer="3198" from-port="2" to-layer="3199" to-port="0" /> <edge from-layer="3199" from-port="2" to-layer="3200" to-port="1" /> <edge from-layer="3200" from-port="2" to-layer="3254" to-port="0" /> <edge from-layer="3201" from-port="0" to-layer="3202" to-port="0" /> <edge from-layer="3202" from-port="1" to-layer="3207" to-port="0" /> <edge from-layer="3203" from-port="0" to-layer="3206" to-port="1" /> <edge from-layer="3204" from-port="0" to-layer="3206" to-port="2" /> <edge from-layer="3205" from-port="0" to-layer="3206" to-port="3" /> <edge from-layer="3206" from-port="4" to-layer="3207" to-port="1" /> <edge from-layer="3207" from-port="2" to-layer="3208" to-port="0" /> <edge from-layer="3208" from-port="1" to-layer="3210" to-port="0" /> <edge from-layer="3209" from-port="0" to-layer="3210" to-port="2" /> <edge from-layer="3210" from-port="3" to-layer="3234" to-port="0" /> <edge from-layer="3211" from-port="0" to-layer="3214" to-port="1" /> <edge from-layer="3212" from-port="0" to-layer="3214" to-port="2" /> <edge from-layer="3213" from-port="0" to-layer="3214" to-port="3" /> <edge from-layer="3214" from-port="5" to-layer="3216" to-port="0" /> <edge from-layer="3215" from-port="0" to-layer="3216" to-port="1" /> <edge from-layer="3216" from-port="2" to-layer="3218" to-port="0" /> <edge from-layer="3217" from-port="0" to-layer="3218" to-port="1" /> <edge from-layer="3218" from-port="2" to-layer="3223" to-port="0" /> <edge from-layer="3218" from-port="2" to-layer="3219" to-port="0" /> <edge from-layer="3218" from-port="2" to-layer="3230" to-port="0" /> <edge from-layer="3219" from-port="2" to-layer="3233" to-port="0" /> <edge from-layer="3220" from-port="0" to-layer="3223" to-port="1" /> <edge from-layer="3221" from-port="0" to-layer="3223" to-port="2" /> <edge from-layer="3222" from-port="0" to-layer="3223" to-port="3" /> <edge from-layer="3223" from-port="5" to-layer="3226" to-port="0" /> <edge from-layer="3224" from-port="0" to-layer="3225" to-port="0" /> <edge from-layer="3225" from-port="1" to-layer="3226" to-port="1" /> <edge from-layer="3226" from-port="2" to-layer="3231" to-port="0" /> <edge from-layer="3227" from-port="0" to-layer="3230" to-port="1" /> <edge from-layer="3228" from-port="0" to-layer="3230" to-port="2" /> <edge from-layer="3229" from-port="0" to-layer="3230" to-port="3" /> <edge from-layer="3230" from-port="5" to-layer="3231" to-port="1" /> <edge from-layer="3231" from-port="2" to-layer="3232" to-port="0" /> <edge from-layer="3232" from-port="2" to-layer="3233" to-port="1" /> <edge from-layer="3233" from-port="2" to-layer="3234" to-port="1" /> <edge from-layer="3234" from-port="2" to-layer="4278" to-port="0" /> <edge from-layer="3234" from-port="2" to-layer="3254" to-port="1" /> <edge from-layer="3235" from-port="0" to-layer="3236" to-port="0" /> <edge from-layer="3236" from-port="1" to-layer="3241" to-port="0" /> <edge from-layer="3237" from-port="0" to-layer="3240" to-port="1" /> <edge from-layer="3238" from-port="0" to-layer="3240" to-port="2" /> <edge from-layer="3239" from-port="0" to-layer="3240" to-port="3" /> <edge from-layer="3240" from-port="4" to-layer="3241" to-port="1" /> <edge from-layer="3241" from-port="2" to-layer="3242" to-port="0" /> <edge from-layer="3242" from-port="1" to-layer="3244" to-port="0" /> <edge from-layer="3243" from-port="0" to-layer="3244" to-port="2" /> <edge from-layer="3244" from-port="3" to-layer="3253" to-port="0" /> <edge from-layer="3245" from-port="0" to-layer="3248" to-port="1" /> <edge from-layer="3246" from-port="0" to-layer="3248" to-port="2" /> <edge from-layer="3247" from-port="0" to-layer="3248" to-port="3" /> <edge from-layer="3248" from-port="5" to-layer="3250" to-port="0" /> <edge from-layer="3249" from-port="0" to-layer="3250" to-port="1" /> <edge from-layer="3250" from-port="2" to-layer="3252" to-port="0" /> <edge from-layer="3251" from-port="0" to-layer="3252" to-port="1" /> <edge from-layer="3252" from-port="2" to-layer="3253" to-port="1" /> <edge from-layer="3253" from-port="2" to-layer="4277" to-port="0" /> <edge from-layer="3253" from-port="2" to-layer="3254" to-port="2" /> <edge from-layer="3254" from-port="4" to-layer="3256" to-port="0" /> <edge from-layer="3255" from-port="0" to-layer="3256" to-port="1" /> <edge from-layer="3256" from-port="2" to-layer="3258" to-port="0" /> <edge from-layer="3257" from-port="0" to-layer="3258" to-port="1" /> <edge from-layer="3258" from-port="2" to-layer="3261" to-port="0" /> <edge from-layer="3259" from-port="0" to-layer="3260" to-port="0" /> <edge from-layer="3260" from-port="1" to-layer="3261" to-port="1" /> <edge from-layer="3261" from-port="2" to-layer="3262" to-port="1" /> <edge from-layer="3262" from-port="2" to-layer="3269" to-port="0" /> <edge from-layer="3262" from-port="2" to-layer="3288" to-port="0" /> <edge from-layer="3262" from-port="2" to-layer="3277" to-port="0" /> <edge from-layer="3263" from-port="0" to-layer="3264" to-port="0" /> <edge from-layer="3264" from-port="1" to-layer="3278" to-port="0" /> <edge from-layer="3265" from-port="0" to-layer="3266" to-port="0" /> <edge from-layer="3266" from-port="1" to-layer="3276" to-port="0" /> <edge from-layer="3267" from-port="0" to-layer="3268" to-port="0" /> <edge from-layer="3268" from-port="1" to-layer="3269" to-port="1" /> <edge from-layer="3269" from-port="2" to-layer="3271" to-port="0" /> <edge from-layer="3270" from-port="0" to-layer="3271" to-port="1" /> <edge from-layer="3271" from-port="2" to-layer="3274" to-port="0" /> <edge from-layer="3272" from-port="0" to-layer="3273" to-port="0" /> <edge from-layer="3273" from-port="1" to-layer="3274" to-port="1" /> <edge from-layer="3274" from-port="2" to-layer="3275" to-port="0" /> <edge from-layer="3275" from-port="1" to-layer="3276" to-port="1" /> <edge from-layer="3276" from-port="2" to-layer="3277" to-port="1" /> <edge from-layer="3277" from-port="2" to-layer="3278" to-port="1" /> <edge from-layer="3278" from-port="2" to-layer="3281" to-port="0" /> <edge from-layer="3279" from-port="0" to-layer="3280" to-port="0" /> <edge from-layer="3280" from-port="1" to-layer="3281" to-port="1" /> <edge from-layer="3281" from-port="2" to-layer="3282" to-port="0" /> <edge from-layer="3282" from-port="4" to-layer="3284" to-port="0" /> <edge from-layer="3282" from-port="3" to-layer="3283" to-port="0" /> <edge from-layer="3283" from-port="1" to-layer="3284" to-port="1" /> <edge from-layer="3284" from-port="2" to-layer="3287" to-port="0" /> <edge from-layer="3285" from-port="0" to-layer="3286" to-port="0" /> <edge from-layer="3286" from-port="1" to-layer="3287" to-port="1" /> <edge from-layer="3287" from-port="2" to-layer="3288" to-port="1" /> <edge from-layer="3288" from-port="2" to-layer="3392" to-port="0" /> <edge from-layer="3288" from-port="2" to-layer="3303" to-port="0" /> <edge from-layer="3288" from-port="2" to-layer="3295" to-port="0" /> <edge from-layer="3289" from-port="0" to-layer="3290" to-port="0" /> <edge from-layer="3290" from-port="1" to-layer="3304" to-port="0" /> <edge from-layer="3291" from-port="0" to-layer="3292" to-port="0" /> <edge from-layer="3292" from-port="1" to-layer="3302" to-port="0" /> <edge from-layer="3293" from-port="0" to-layer="3294" to-port="0" /> <edge from-layer="3294" from-port="1" to-layer="3295" to-port="1" /> <edge from-layer="3295" from-port="2" to-layer="3297" to-port="0" /> <edge from-layer="3296" from-port="0" to-layer="3297" to-port="1" /> <edge from-layer="3297" from-port="2" to-layer="3300" to-port="0" /> <edge from-layer="3298" from-port="0" to-layer="3299" to-port="0" /> <edge from-layer="3299" from-port="1" to-layer="3300" to-port="1" /> <edge from-layer="3300" from-port="2" to-layer="3301" to-port="0" /> <edge from-layer="3301" from-port="1" to-layer="3302" to-port="1" /> <edge from-layer="3302" from-port="2" to-layer="3303" to-port="1" /> <edge from-layer="3303" from-port="2" to-layer="3304" to-port="1" /> <edge from-layer="3304" from-port="2" to-layer="3307" to-port="0" /> <edge from-layer="3305" from-port="0" to-layer="3306" to-port="0" /> <edge from-layer="3306" from-port="1" to-layer="3307" to-port="1" /> <edge from-layer="3307" from-port="2" to-layer="3311" to-port="0" /> <edge from-layer="3307" from-port="2" to-layer="3344" to-port="0" /> <edge from-layer="3307" from-port="2" to-layer="3378" to-port="0" /> <edge from-layer="3308" from-port="0" to-layer="3311" to-port="1" /> <edge from-layer="3309" from-port="0" to-layer="3311" to-port="2" /> <edge from-layer="3310" from-port="0" to-layer="3311" to-port="3" /> <edge from-layer="3311" from-port="5" to-layer="3313" to-port="0" /> <edge from-layer="3312" from-port="0" to-layer="3313" to-port="1" /> <edge from-layer="3313" from-port="2" to-layer="3315" to-port="0" /> <edge from-layer="3314" from-port="0" to-layer="3315" to-port="1" /> <edge from-layer="3315" from-port="2" to-layer="3327" to-port="0" /> <edge from-layer="3315" from-port="2" to-layer="3316" to-port="0" /> <edge from-layer="3315" from-port="2" to-layer="3320" to-port="0" /> <edge from-layer="3316" from-port="2" to-layer="3330" to-port="0" /> <edge from-layer="3317" from-port="0" to-layer="3320" to-port="1" /> <edge from-layer="3318" from-port="0" to-layer="3320" to-port="2" /> <edge from-layer="3319" from-port="0" to-layer="3320" to-port="3" /> <edge from-layer="3320" from-port="5" to-layer="3323" to-port="0" /> <edge from-layer="3321" from-port="0" to-layer="3322" to-port="0" /> <edge from-layer="3322" from-port="1" to-layer="3323" to-port="1" /> <edge from-layer="3323" from-port="2" to-layer="3328" to-port="0" /> <edge from-layer="3324" from-port="0" to-layer="3327" to-port="1" /> <edge from-layer="3325" from-port="0" to-layer="3327" to-port="2" /> <edge from-layer="3326" from-port="0" to-layer="3327" to-port="3" /> <edge from-layer="3327" from-port="5" to-layer="3328" to-port="1" /> <edge from-layer="3328" from-port="2" to-layer="3329" to-port="0" /> <edge from-layer="3329" from-port="2" to-layer="3330" to-port="1" /> <edge from-layer="3330" from-port="2" to-layer="3384" to-port="0" /> <edge from-layer="3331" from-port="0" to-layer="3332" to-port="0" /> <edge from-layer="3332" from-port="1" to-layer="3337" to-port="0" /> <edge from-layer="3333" from-port="0" to-layer="3336" to-port="1" /> <edge from-layer="3334" from-port="0" to-layer="3336" to-port="2" /> <edge from-layer="3335" from-port="0" to-layer="3336" to-port="3" /> <edge from-layer="3336" from-port="4" to-layer="3337" to-port="1" /> <edge from-layer="3337" from-port="2" to-layer="3338" to-port="0" /> <edge from-layer="3338" from-port="1" to-layer="3340" to-port="0" /> <edge from-layer="3339" from-port="0" to-layer="3340" to-port="2" /> <edge from-layer="3340" from-port="3" to-layer="3364" to-port="0" /> <edge from-layer="3341" from-port="0" to-layer="3344" to-port="1" /> <edge from-layer="3342" from-port="0" to-layer="3344" to-port="2" /> <edge from-layer="3343" from-port="0" to-layer="3344" to-port="3" /> <edge from-layer="3344" from-port="5" to-layer="3346" to-port="0" /> <edge from-layer="3345" from-port="0" to-layer="3346" to-port="1" /> <edge from-layer="3346" from-port="2" to-layer="3348" to-port="0" /> <edge from-layer="3347" from-port="0" to-layer="3348" to-port="1" /> <edge from-layer="3348" from-port="2" to-layer="3360" to-port="0" /> <edge from-layer="3348" from-port="2" to-layer="3349" to-port="0" /> <edge from-layer="3348" from-port="2" to-layer="3353" to-port="0" /> <edge from-layer="3349" from-port="2" to-layer="3363" to-port="0" /> <edge from-layer="3350" from-port="0" to-layer="3353" to-port="1" /> <edge from-layer="3351" from-port="0" to-layer="3353" to-port="2" /> <edge from-layer="3352" from-port="0" to-layer="3353" to-port="3" /> <edge from-layer="3353" from-port="5" to-layer="3356" to-port="0" /> <edge from-layer="3354" from-port="0" to-layer="3355" to-port="0" /> <edge from-layer="3355" from-port="1" to-layer="3356" to-port="1" /> <edge from-layer="3356" from-port="2" to-layer="3361" to-port="0" /> <edge from-layer="3357" from-port="0" to-layer="3360" to-port="1" /> <edge from-layer="3358" from-port="0" to-layer="3360" to-port="2" /> <edge from-layer="3359" from-port="0" to-layer="3360" to-port="3" /> <edge from-layer="3360" from-port="5" to-layer="3361" to-port="1" /> <edge from-layer="3361" from-port="2" to-layer="3362" to-port="0" /> <edge from-layer="3362" from-port="2" to-layer="3363" to-port="1" /> <edge from-layer="3363" from-port="2" to-layer="3364" to-port="1" /> <edge from-layer="3364" from-port="2" to-layer="4276" to-port="0" /> <edge from-layer="3364" from-port="2" to-layer="3384" to-port="1" /> <edge from-layer="3365" from-port="0" to-layer="3366" to-port="0" /> <edge from-layer="3366" from-port="1" to-layer="3371" to-port="0" /> <edge from-layer="3367" from-port="0" to-layer="3370" to-port="1" /> <edge from-layer="3368" from-port="0" to-layer="3370" to-port="2" /> <edge from-layer="3369" from-port="0" to-layer="3370" to-port="3" /> <edge from-layer="3370" from-port="4" to-layer="3371" to-port="1" /> <edge from-layer="3371" from-port="2" to-layer="3372" to-port="0" /> <edge from-layer="3372" from-port="1" to-layer="3374" to-port="0" /> <edge from-layer="3373" from-port="0" to-layer="3374" to-port="2" /> <edge from-layer="3374" from-port="3" to-layer="3383" to-port="0" /> <edge from-layer="3375" from-port="0" to-layer="3378" to-port="1" /> <edge from-layer="3376" from-port="0" to-layer="3378" to-port="2" /> <edge from-layer="3377" from-port="0" to-layer="3378" to-port="3" /> <edge from-layer="3378" from-port="5" to-layer="3380" to-port="0" /> <edge from-layer="3379" from-port="0" to-layer="3380" to-port="1" /> <edge from-layer="3380" from-port="2" to-layer="3382" to-port="0" /> <edge from-layer="3381" from-port="0" to-layer="3382" to-port="1" /> <edge from-layer="3382" from-port="2" to-layer="3383" to-port="1" /> <edge from-layer="3383" from-port="2" to-layer="4275" to-port="0" /> <edge from-layer="3383" from-port="2" to-layer="3384" to-port="2" /> <edge from-layer="3384" from-port="4" to-layer="3386" to-port="0" /> <edge from-layer="3385" from-port="0" to-layer="3386" to-port="1" /> <edge from-layer="3386" from-port="2" to-layer="3388" to-port="0" /> <edge from-layer="3387" from-port="0" to-layer="3388" to-port="1" /> <edge from-layer="3388" from-port="2" to-layer="3391" to-port="0" /> <edge from-layer="3389" from-port="0" to-layer="3390" to-port="0" /> <edge from-layer="3390" from-port="1" to-layer="3391" to-port="1" /> <edge from-layer="3391" from-port="2" to-layer="3392" to-port="1" /> <edge from-layer="3392" from-port="2" to-layer="3418" to-port="0" /> <edge from-layer="3392" from-port="2" to-layer="3399" to-port="0" /> <edge from-layer="3392" from-port="2" to-layer="3407" to-port="0" /> <edge from-layer="3393" from-port="0" to-layer="3394" to-port="0" /> <edge from-layer="3394" from-port="1" to-layer="3408" to-port="0" /> <edge from-layer="3395" from-port="0" to-layer="3396" to-port="0" /> <edge from-layer="3396" from-port="1" to-layer="3406" to-port="0" /> <edge from-layer="3397" from-port="0" to-layer="3398" to-port="0" /> <edge from-layer="3398" from-port="1" to-layer="3399" to-port="1" /> <edge from-layer="3399" from-port="2" to-layer="3401" to-port="0" /> <edge from-layer="3400" from-port="0" to-layer="3401" to-port="1" /> <edge from-layer="3401" from-port="2" to-layer="3404" to-port="0" /> <edge from-layer="3402" from-port="0" to-layer="3403" to-port="0" /> <edge from-layer="3403" from-port="1" to-layer="3404" to-port="1" /> <edge from-layer="3404" from-port="2" to-layer="3405" to-port="0" /> <edge from-layer="3405" from-port="1" to-layer="3406" to-port="1" /> <edge from-layer="3406" from-port="2" to-layer="3407" to-port="1" /> <edge from-layer="3407" from-port="2" to-layer="3408" to-port="1" /> <edge from-layer="3408" from-port="2" to-layer="3411" to-port="0" /> <edge from-layer="3409" from-port="0" to-layer="3410" to-port="0" /> <edge from-layer="3410" from-port="1" to-layer="3411" to-port="1" /> <edge from-layer="3411" from-port="2" to-layer="3412" to-port="0" /> <edge from-layer="3412" from-port="3" to-layer="3413" to-port="0" /> <edge from-layer="3412" from-port="4" to-layer="3414" to-port="0" /> <edge from-layer="3413" from-port="1" to-layer="3414" to-port="1" /> <edge from-layer="3414" from-port="2" to-layer="3417" to-port="0" /> <edge from-layer="3415" from-port="0" to-layer="3416" to-port="0" /> <edge from-layer="3416" from-port="1" to-layer="3417" to-port="1" /> <edge from-layer="3417" from-port="2" to-layer="3418" to-port="1" /> <edge from-layer="3418" from-port="2" to-layer="3522" to-port="0" /> <edge from-layer="3418" from-port="2" to-layer="3433" to-port="0" /> <edge from-layer="3418" from-port="2" to-layer="3425" to-port="0" /> <edge from-layer="3419" from-port="0" to-layer="3420" to-port="0" /> <edge from-layer="3420" from-port="1" to-layer="3434" to-port="0" /> <edge from-layer="3421" from-port="0" to-layer="3422" to-port="0" /> <edge from-layer="3422" from-port="1" to-layer="3432" to-port="0" /> <edge from-layer="3423" from-port="0" to-layer="3424" to-port="0" /> <edge from-layer="3424" from-port="1" to-layer="3425" to-port="1" /> <edge from-layer="3425" from-port="2" to-layer="3427" to-port="0" /> <edge from-layer="3426" from-port="0" to-layer="3427" to-port="1" /> <edge from-layer="3427" from-port="2" to-layer="3430" to-port="0" /> <edge from-layer="3428" from-port="0" to-layer="3429" to-port="0" /> <edge from-layer="3429" from-port="1" to-layer="3430" to-port="1" /> <edge from-layer="3430" from-port="2" to-layer="3431" to-port="0" /> <edge from-layer="3431" from-port="1" to-layer="3432" to-port="1" /> <edge from-layer="3432" from-port="2" to-layer="3433" to-port="1" /> <edge from-layer="3433" from-port="2" to-layer="3434" to-port="1" /> <edge from-layer="3434" from-port="2" to-layer="3437" to-port="0" /> <edge from-layer="3435" from-port="0" to-layer="3436" to-port="0" /> <edge from-layer="3436" from-port="1" to-layer="3437" to-port="1" /> <edge from-layer="3437" from-port="2" to-layer="3441" to-port="0" /> <edge from-layer="3437" from-port="2" to-layer="3508" to-port="0" /> <edge from-layer="3437" from-port="2" to-layer="3474" to-port="0" /> <edge from-layer="3438" from-port="0" to-layer="3441" to-port="1" /> <edge from-layer="3439" from-port="0" to-layer="3441" to-port="2" /> <edge from-layer="3440" from-port="0" to-layer="3441" to-port="3" /> <edge from-layer="3441" from-port="5" to-layer="3443" to-port="0" /> <edge from-layer="3442" from-port="0" to-layer="3443" to-port="1" /> <edge from-layer="3443" from-port="2" to-layer="3445" to-port="0" /> <edge from-layer="3444" from-port="0" to-layer="3445" to-port="1" /> <edge from-layer="3445" from-port="2" to-layer="3457" to-port="0" /> <edge from-layer="3445" from-port="2" to-layer="3446" to-port="0" /> <edge from-layer="3445" from-port="2" to-layer="3450" to-port="0" /> <edge from-layer="3446" from-port="2" to-layer="3460" to-port="0" /> <edge from-layer="3447" from-port="0" to-layer="3450" to-port="1" /> <edge from-layer="3448" from-port="0" to-layer="3450" to-port="2" /> <edge from-layer="3449" from-port="0" to-layer="3450" to-port="3" /> <edge from-layer="3450" from-port="5" to-layer="3453" to-port="0" /> <edge from-layer="3451" from-port="0" to-layer="3452" to-port="0" /> <edge from-layer="3452" from-port="1" to-layer="3453" to-port="1" /> <edge from-layer="3453" from-port="2" to-layer="3458" to-port="0" /> <edge from-layer="3454" from-port="0" to-layer="3457" to-port="1" /> <edge from-layer="3455" from-port="0" to-layer="3457" to-port="2" /> <edge from-layer="3456" from-port="0" to-layer="3457" to-port="3" /> <edge from-layer="3457" from-port="5" to-layer="3458" to-port="1" /> <edge from-layer="3458" from-port="2" to-layer="3459" to-port="0" /> <edge from-layer="3459" from-port="2" to-layer="3460" to-port="1" /> <edge from-layer="3460" from-port="2" to-layer="3514" to-port="0" /> <edge from-layer="3461" from-port="0" to-layer="3462" to-port="0" /> <edge from-layer="3462" from-port="1" to-layer="3467" to-port="0" /> <edge from-layer="3463" from-port="0" to-layer="3466" to-port="1" /> <edge from-layer="3464" from-port="0" to-layer="3466" to-port="2" /> <edge from-layer="3465" from-port="0" to-layer="3466" to-port="3" /> <edge from-layer="3466" from-port="4" to-layer="3467" to-port="1" /> <edge from-layer="3467" from-port="2" to-layer="3468" to-port="0" /> <edge from-layer="3468" from-port="1" to-layer="3470" to-port="0" /> <edge from-layer="3469" from-port="0" to-layer="3470" to-port="2" /> <edge from-layer="3470" from-port="3" to-layer="3494" to-port="0" /> <edge from-layer="3471" from-port="0" to-layer="3474" to-port="1" /> <edge from-layer="3472" from-port="0" to-layer="3474" to-port="2" /> <edge from-layer="3473" from-port="0" to-layer="3474" to-port="3" /> <edge from-layer="3474" from-port="5" to-layer="3476" to-port="0" /> <edge from-layer="3475" from-port="0" to-layer="3476" to-port="1" /> <edge from-layer="3476" from-port="2" to-layer="3478" to-port="0" /> <edge from-layer="3477" from-port="0" to-layer="3478" to-port="1" /> <edge from-layer="3478" from-port="2" to-layer="3479" to-port="0" /> <edge from-layer="3478" from-port="2" to-layer="3483" to-port="0" /> <edge from-layer="3478" from-port="2" to-layer="3490" to-port="0" /> <edge from-layer="3479" from-port="2" to-layer="3493" to-port="0" /> <edge from-layer="3480" from-port="0" to-layer="3483" to-port="1" /> <edge from-layer="3481" from-port="0" to-layer="3483" to-port="2" /> <edge from-layer="3482" from-port="0" to-layer="3483" to-port="3" /> <edge from-layer="3483" from-port="5" to-layer="3486" to-port="0" /> <edge from-layer="3484" from-port="0" to-layer="3485" to-port="0" /> <edge from-layer="3485" from-port="1" to-layer="3486" to-port="1" /> <edge from-layer="3486" from-port="2" to-layer="3491" to-port="0" /> <edge from-layer="3487" from-port="0" to-layer="3490" to-port="1" /> <edge from-layer="3488" from-port="0" to-layer="3490" to-port="2" /> <edge from-layer="3489" from-port="0" to-layer="3490" to-port="3" /> <edge from-layer="3490" from-port="5" to-layer="3491" to-port="1" /> <edge from-layer="3491" from-port="2" to-layer="3492" to-port="0" /> <edge from-layer="3492" from-port="2" to-layer="3493" to-port="1" /> <edge from-layer="3493" from-port="2" to-layer="3494" to-port="1" /> <edge from-layer="3494" from-port="2" to-layer="4274" to-port="0" /> <edge from-layer="3494" from-port="2" to-layer="3514" to-port="1" /> <edge from-layer="3495" from-port="0" to-layer="3496" to-port="0" /> <edge from-layer="3496" from-port="1" to-layer="3501" to-port="0" /> <edge from-layer="3497" from-port="0" to-layer="3500" to-port="1" /> <edge from-layer="3498" from-port="0" to-layer="3500" to-port="2" /> <edge from-layer="3499" from-port="0" to-layer="3500" to-port="3" /> <edge from-layer="3500" from-port="4" to-layer="3501" to-port="1" /> <edge from-layer="3501" from-port="2" to-layer="3502" to-port="0" /> <edge from-layer="3502" from-port="1" to-layer="3504" to-port="0" /> <edge from-layer="3503" from-port="0" to-layer="3504" to-port="2" /> <edge from-layer="3504" from-port="3" to-layer="3513" to-port="0" /> <edge from-layer="3505" from-port="0" to-layer="3508" to-port="1" /> <edge from-layer="3506" from-port="0" to-layer="3508" to-port="2" /> <edge from-layer="3507" from-port="0" to-layer="3508" to-port="3" /> <edge from-layer="3508" from-port="5" to-layer="3510" to-port="0" /> <edge from-layer="3509" from-port="0" to-layer="3510" to-port="1" /> <edge from-layer="3510" from-port="2" to-layer="3512" to-port="0" /> <edge from-layer="3511" from-port="0" to-layer="3512" to-port="1" /> <edge from-layer="3512" from-port="2" to-layer="3513" to-port="1" /> <edge from-layer="3513" from-port="2" to-layer="4273" to-port="0" /> <edge from-layer="3513" from-port="2" to-layer="3514" to-port="2" /> <edge from-layer="3514" from-port="4" to-layer="3516" to-port="0" /> <edge from-layer="3515" from-port="0" to-layer="3516" to-port="1" /> <edge from-layer="3516" from-port="2" to-layer="3518" to-port="0" /> <edge from-layer="3517" from-port="0" to-layer="3518" to-port="1" /> <edge from-layer="3518" from-port="2" to-layer="3521" to-port="0" /> <edge from-layer="3519" from-port="0" to-layer="3520" to-port="0" /> <edge from-layer="3520" from-port="1" to-layer="3521" to-port="1" /> <edge from-layer="3521" from-port="2" to-layer="3522" to-port="1" /> <edge from-layer="3522" from-port="2" to-layer="3548" to-port="0" /> <edge from-layer="3522" from-port="2" to-layer="3529" to-port="0" /> <edge from-layer="3522" from-port="2" to-layer="3537" to-port="0" /> <edge from-layer="3523" from-port="0" to-layer="3524" to-port="0" /> <edge from-layer="3524" from-port="1" to-layer="3538" to-port="0" /> <edge from-layer="3525" from-port="0" to-layer="3526" to-port="0" /> <edge from-layer="3526" from-port="1" to-layer="3536" to-port="0" /> <edge from-layer="3527" from-port="0" to-layer="3528" to-port="0" /> <edge from-layer="3528" from-port="1" to-layer="3529" to-port="1" /> <edge from-layer="3529" from-port="2" to-layer="3531" to-port="0" /> <edge from-layer="3530" from-port="0" to-layer="3531" to-port="1" /> <edge from-layer="3531" from-port="2" to-layer="3534" to-port="0" /> <edge from-layer="3532" from-port="0" to-layer="3533" to-port="0" /> <edge from-layer="3533" from-port="1" to-layer="3534" to-port="1" /> <edge from-layer="3534" from-port="2" to-layer="3535" to-port="0" /> <edge from-layer="3535" from-port="1" to-layer="3536" to-port="1" /> <edge from-layer="3536" from-port="2" to-layer="3537" to-port="1" /> <edge from-layer="3537" from-port="2" to-layer="3538" to-port="1" /> <edge from-layer="3538" from-port="2" to-layer="3541" to-port="0" /> <edge from-layer="3539" from-port="0" to-layer="3540" to-port="0" /> <edge from-layer="3540" from-port="1" to-layer="3541" to-port="1" /> <edge from-layer="3541" from-port="2" to-layer="3542" to-port="0" /> <edge from-layer="3542" from-port="4" to-layer="3544" to-port="0" /> <edge from-layer="3542" from-port="3" to-layer="3543" to-port="0" /> <edge from-layer="3543" from-port="1" to-layer="3544" to-port="1" /> <edge from-layer="3544" from-port="2" to-layer="3547" to-port="0" /> <edge from-layer="3545" from-port="0" to-layer="3546" to-port="0" /> <edge from-layer="3546" from-port="1" to-layer="3547" to-port="1" /> <edge from-layer="3547" from-port="2" to-layer="3548" to-port="1" /> <edge from-layer="3548" from-port="2" to-layer="3555" to-port="0" /> <edge from-layer="3548" from-port="2" to-layer="3563" to-port="0" /> <edge from-layer="3548" from-port="2" to-layer="3652" to-port="0" /> <edge from-layer="3549" from-port="0" to-layer="3550" to-port="0" /> <edge from-layer="3550" from-port="1" to-layer="3564" to-port="0" /> <edge from-layer="3551" from-port="0" to-layer="3552" to-port="0" /> <edge from-layer="3552" from-port="1" to-layer="3562" to-port="0" /> <edge from-layer="3553" from-port="0" to-layer="3554" to-port="0" /> <edge from-layer="3554" from-port="1" to-layer="3555" to-port="1" /> <edge from-layer="3555" from-port="2" to-layer="3557" to-port="0" /> <edge from-layer="3556" from-port="0" to-layer="3557" to-port="1" /> <edge from-layer="3557" from-port="2" to-layer="3560" to-port="0" /> <edge from-layer="3558" from-port="0" to-layer="3559" to-port="0" /> <edge from-layer="3559" from-port="1" to-layer="3560" to-port="1" /> <edge from-layer="3560" from-port="2" to-layer="3561" to-port="0" /> <edge from-layer="3561" from-port="1" to-layer="3562" to-port="1" /> <edge from-layer="3562" from-port="2" to-layer="3563" to-port="1" /> <edge from-layer="3563" from-port="2" to-layer="3564" to-port="1" /> <edge from-layer="3564" from-port="2" to-layer="3567" to-port="0" /> <edge from-layer="3565" from-port="0" to-layer="3566" to-port="0" /> <edge from-layer="3566" from-port="1" to-layer="3567" to-port="1" /> <edge from-layer="3567" from-port="2" to-layer="3571" to-port="0" /> <edge from-layer="3567" from-port="2" to-layer="3604" to-port="0" /> <edge from-layer="3567" from-port="2" to-layer="3638" to-port="0" /> <edge from-layer="3568" from-port="0" to-layer="3571" to-port="1" /> <edge from-layer="3569" from-port="0" to-layer="3571" to-port="2" /> <edge from-layer="3570" from-port="0" to-layer="3571" to-port="3" /> <edge from-layer="3571" from-port="5" to-layer="3573" to-port="0" /> <edge from-layer="3572" from-port="0" to-layer="3573" to-port="1" /> <edge from-layer="3573" from-port="2" to-layer="3575" to-port="0" /> <edge from-layer="3574" from-port="0" to-layer="3575" to-port="1" /> <edge from-layer="3575" from-port="2" to-layer="3576" to-port="0" /> <edge from-layer="3575" from-port="2" to-layer="3587" to-port="0" /> <edge from-layer="3575" from-port="2" to-layer="3580" to-port="0" /> <edge from-layer="3576" from-port="2" to-layer="3590" to-port="0" /> <edge from-layer="3577" from-port="0" to-layer="3580" to-port="1" /> <edge from-layer="3578" from-port="0" to-layer="3580" to-port="2" /> <edge from-layer="3579" from-port="0" to-layer="3580" to-port="3" /> <edge from-layer="3580" from-port="5" to-layer="3583" to-port="0" /> <edge from-layer="3581" from-port="0" to-layer="3582" to-port="0" /> <edge from-layer="3582" from-port="1" to-layer="3583" to-port="1" /> <edge from-layer="3583" from-port="2" to-layer="3588" to-port="0" /> <edge from-layer="3584" from-port="0" to-layer="3587" to-port="1" /> <edge from-layer="3585" from-port="0" to-layer="3587" to-port="2" /> <edge from-layer="3586" from-port="0" to-layer="3587" to-port="3" /> <edge from-layer="3587" from-port="5" to-layer="3588" to-port="1" /> <edge from-layer="3588" from-port="2" to-layer="3589" to-port="0" /> <edge from-layer="3589" from-port="2" to-layer="3590" to-port="1" /> <edge from-layer="3590" from-port="2" to-layer="3644" to-port="0" /> <edge from-layer="3591" from-port="0" to-layer="3592" to-port="0" /> <edge from-layer="3592" from-port="1" to-layer="3597" to-port="0" /> <edge from-layer="3593" from-port="0" to-layer="3596" to-port="1" /> <edge from-layer="3594" from-port="0" to-layer="3596" to-port="2" /> <edge from-layer="3595" from-port="0" to-layer="3596" to-port="3" /> <edge from-layer="3596" from-port="4" to-layer="3597" to-port="1" /> <edge from-layer="3597" from-port="2" to-layer="3598" to-port="0" /> <edge from-layer="3598" from-port="1" to-layer="3600" to-port="0" /> <edge from-layer="3599" from-port="0" to-layer="3600" to-port="2" /> <edge from-layer="3600" from-port="3" to-layer="3624" to-port="0" /> <edge from-layer="3601" from-port="0" to-layer="3604" to-port="1" /> <edge from-layer="3602" from-port="0" to-layer="3604" to-port="2" /> <edge from-layer="3603" from-port="0" to-layer="3604" to-port="3" /> <edge from-layer="3604" from-port="5" to-layer="3606" to-port="0" /> <edge from-layer="3605" from-port="0" to-layer="3606" to-port="1" /> <edge from-layer="3606" from-port="2" to-layer="3608" to-port="0" /> <edge from-layer="3607" from-port="0" to-layer="3608" to-port="1" /> <edge from-layer="3608" from-port="2" to-layer="3620" to-port="0" /> <edge from-layer="3608" from-port="2" to-layer="3609" to-port="0" /> <edge from-layer="3608" from-port="2" to-layer="3613" to-port="0" /> <edge from-layer="3609" from-port="2" to-layer="3623" to-port="0" /> <edge from-layer="3610" from-port="0" to-layer="3613" to-port="1" /> <edge from-layer="3611" from-port="0" to-layer="3613" to-port="2" /> <edge from-layer="3612" from-port="0" to-layer="3613" to-port="3" /> <edge from-layer="3613" from-port="5" to-layer="3616" to-port="0" /> <edge from-layer="3614" from-port="0" to-layer="3615" to-port="0" /> <edge from-layer="3615" from-port="1" to-layer="3616" to-port="1" /> <edge from-layer="3616" from-port="2" to-layer="3621" to-port="0" /> <edge from-layer="3617" from-port="0" to-layer="3620" to-port="1" /> <edge from-layer="3618" from-port="0" to-layer="3620" to-port="2" /> <edge from-layer="3619" from-port="0" to-layer="3620" to-port="3" /> <edge from-layer="3620" from-port="5" to-layer="3621" to-port="1" /> <edge from-layer="3621" from-port="2" to-layer="3622" to-port="0" /> <edge from-layer="3622" from-port="2" to-layer="3623" to-port="1" /> <edge from-layer="3623" from-port="2" to-layer="3624" to-port="1" /> <edge from-layer="3624" from-port="2" to-layer="3644" to-port="1" /> <edge from-layer="3624" from-port="2" to-layer="4272" to-port="0" /> <edge from-layer="3625" from-port="0" to-layer="3626" to-port="0" /> <edge from-layer="3626" from-port="1" to-layer="3631" to-port="0" /> <edge from-layer="3627" from-port="0" to-layer="3630" to-port="1" /> <edge from-layer="3628" from-port="0" to-layer="3630" to-port="2" /> <edge from-layer="3629" from-port="0" to-layer="3630" to-port="3" /> <edge from-layer="3630" from-port="4" to-layer="3631" to-port="1" /> <edge from-layer="3631" from-port="2" to-layer="3632" to-port="0" /> <edge from-layer="3632" from-port="1" to-layer="3634" to-port="0" /> <edge from-layer="3633" from-port="0" to-layer="3634" to-port="2" /> <edge from-layer="3634" from-port="3" to-layer="3643" to-port="0" /> <edge from-layer="3635" from-port="0" to-layer="3638" to-port="1" /> <edge from-layer="3636" from-port="0" to-layer="3638" to-port="2" /> <edge from-layer="3637" from-port="0" to-layer="3638" to-port="3" /> <edge from-layer="3638" from-port="5" to-layer="3640" to-port="0" /> <edge from-layer="3639" from-port="0" to-layer="3640" to-port="1" /> <edge from-layer="3640" from-port="2" to-layer="3642" to-port="0" /> <edge from-layer="3641" from-port="0" to-layer="3642" to-port="1" /> <edge from-layer="3642" from-port="2" to-layer="3643" to-port="1" /> <edge from-layer="3643" from-port="2" to-layer="3644" to-port="2" /> <edge from-layer="3643" from-port="2" to-layer="4271" to-port="0" /> <edge from-layer="3644" from-port="4" to-layer="3646" to-port="0" /> <edge from-layer="3645" from-port="0" to-layer="3646" to-port="1" /> <edge from-layer="3646" from-port="2" to-layer="3648" to-port="0" /> <edge from-layer="3647" from-port="0" to-layer="3648" to-port="1" /> <edge from-layer="3648" from-port="2" to-layer="3651" to-port="0" /> <edge from-layer="3649" from-port="0" to-layer="3650" to-port="0" /> <edge from-layer="3650" from-port="1" to-layer="3651" to-port="1" /> <edge from-layer="3651" from-port="2" to-layer="3652" to-port="1" /> <edge from-layer="3652" from-port="2" to-layer="3667" to-port="0" /> <edge from-layer="3652" from-port="2" to-layer="3678" to-port="0" /> <edge from-layer="3652" from-port="2" to-layer="3659" to-port="0" /> <edge from-layer="3653" from-port="0" to-layer="3654" to-port="0" /> <edge from-layer="3654" from-port="1" to-layer="3668" to-port="0" /> <edge from-layer="3655" from-port="0" to-layer="3656" to-port="0" /> <edge from-layer="3656" from-port="1" to-layer="3666" to-port="0" /> <edge from-layer="3657" from-port="0" to-layer="3658" to-port="0" /> <edge from-layer="3658" from-port="1" to-layer="3659" to-port="1" /> <edge from-layer="3659" from-port="2" to-layer="3661" to-port="0" /> <edge from-layer="3660" from-port="0" to-layer="3661" to-port="1" /> <edge from-layer="3661" from-port="2" to-layer="3664" to-port="0" /> <edge from-layer="3662" from-port="0" to-layer="3663" to-port="0" /> <edge from-layer="3663" from-port="1" to-layer="3664" to-port="1" /> <edge from-layer="3664" from-port="2" to-layer="3665" to-port="0" /> <edge from-layer="3665" from-port="1" to-layer="3666" to-port="1" /> <edge from-layer="3666" from-port="2" to-layer="3667" to-port="1" /> <edge from-layer="3667" from-port="2" to-layer="3668" to-port="1" /> <edge from-layer="3668" from-port="2" to-layer="3671" to-port="0" /> <edge from-layer="3669" from-port="0" to-layer="3670" to-port="0" /> <edge from-layer="3670" from-port="1" to-layer="3671" to-port="1" /> <edge from-layer="3671" from-port="2" to-layer="3672" to-port="0" /> <edge from-layer="3672" from-port="4" to-layer="3674" to-port="0" /> <edge from-layer="3672" from-port="3" to-layer="3673" to-port="0" /> <edge from-layer="3673" from-port="1" to-layer="3674" to-port="1" /> <edge from-layer="3674" from-port="2" to-layer="3677" to-port="0" /> <edge from-layer="3675" from-port="0" to-layer="3676" to-port="0" /> <edge from-layer="3676" from-port="1" to-layer="3677" to-port="1" /> <edge from-layer="3677" from-port="2" to-layer="3678" to-port="1" /> <edge from-layer="3678" from-port="2" to-layer="3685" to-port="0" /> <edge from-layer="3678" from-port="2" to-layer="3782" to-port="0" /> <edge from-layer="3678" from-port="2" to-layer="3693" to-port="0" /> <edge from-layer="3679" from-port="0" to-layer="3680" to-port="0" /> <edge from-layer="3680" from-port="1" to-layer="3694" to-port="0" /> <edge from-layer="3681" from-port="0" to-layer="3682" to-port="0" /> <edge from-layer="3682" from-port="1" to-layer="3692" to-port="0" /> <edge from-layer="3683" from-port="0" to-layer="3684" to-port="0" /> <edge from-layer="3684" from-port="1" to-layer="3685" to-port="1" /> <edge from-layer="3685" from-port="2" to-layer="3687" to-port="0" /> <edge from-layer="3686" from-port="0" to-layer="3687" to-port="1" /> <edge from-layer="3687" from-port="2" to-layer="3690" to-port="0" /> <edge from-layer="3688" from-port="0" to-layer="3689" to-port="0" /> <edge from-layer="3689" from-port="1" to-layer="3690" to-port="1" /> <edge from-layer="3690" from-port="2" to-layer="3691" to-port="0" /> <edge from-layer="3691" from-port="1" to-layer="3692" to-port="1" /> <edge from-layer="3692" from-port="2" to-layer="3693" to-port="1" /> <edge from-layer="3693" from-port="2" to-layer="3694" to-port="1" /> <edge from-layer="3694" from-port="2" to-layer="3697" to-port="0" /> <edge from-layer="3695" from-port="0" to-layer="3696" to-port="0" /> <edge from-layer="3696" from-port="1" to-layer="3697" to-port="1" /> <edge from-layer="3697" from-port="2" to-layer="3734" to-port="0" /> <edge from-layer="3697" from-port="2" to-layer="3768" to-port="0" /> <edge from-layer="3697" from-port="2" to-layer="3701" to-port="0" /> <edge from-layer="3698" from-port="0" to-layer="3701" to-port="1" /> <edge from-layer="3699" from-port="0" to-layer="3701" to-port="2" /> <edge from-layer="3700" from-port="0" to-layer="3701" to-port="3" /> <edge from-layer="3701" from-port="5" to-layer="3703" to-port="0" /> <edge from-layer="3702" from-port="0" to-layer="3703" to-port="1" /> <edge from-layer="3703" from-port="2" to-layer="3705" to-port="0" /> <edge from-layer="3704" from-port="0" to-layer="3705" to-port="1" /> <edge from-layer="3705" from-port="2" to-layer="3717" to-port="0" /> <edge from-layer="3705" from-port="2" to-layer="3706" to-port="0" /> <edge from-layer="3705" from-port="2" to-layer="3710" to-port="0" /> <edge from-layer="3706" from-port="2" to-layer="3720" to-port="0" /> <edge from-layer="3707" from-port="0" to-layer="3710" to-port="1" /> <edge from-layer="3708" from-port="0" to-layer="3710" to-port="2" /> <edge from-layer="3709" from-port="0" to-layer="3710" to-port="3" /> <edge from-layer="3710" from-port="5" to-layer="3713" to-port="0" /> <edge from-layer="3711" from-port="0" to-layer="3712" to-port="0" /> <edge from-layer="3712" from-port="1" to-layer="3713" to-port="1" /> <edge from-layer="3713" from-port="2" to-layer="3718" to-port="0" /> <edge from-layer="3714" from-port="0" to-layer="3717" to-port="1" /> <edge from-layer="3715" from-port="0" to-layer="3717" to-port="2" /> <edge from-layer="3716" from-port="0" to-layer="3717" to-port="3" /> <edge from-layer="3717" from-port="5" to-layer="3718" to-port="1" /> <edge from-layer="3718" from-port="2" to-layer="3719" to-port="0" /> <edge from-layer="3719" from-port="2" to-layer="3720" to-port="1" /> <edge from-layer="3720" from-port="2" to-layer="3774" to-port="0" /> <edge from-layer="3721" from-port="0" to-layer="3722" to-port="0" /> <edge from-layer="3722" from-port="1" to-layer="3727" to-port="0" /> <edge from-layer="3723" from-port="0" to-layer="3726" to-port="1" /> <edge from-layer="3724" from-port="0" to-layer="3726" to-port="2" /> <edge from-layer="3725" from-port="0" to-layer="3726" to-port="3" /> <edge from-layer="3726" from-port="4" to-layer="3727" to-port="1" /> <edge from-layer="3727" from-port="2" to-layer="3728" to-port="0" /> <edge from-layer="3728" from-port="1" to-layer="3730" to-port="0" /> <edge from-layer="3729" from-port="0" to-layer="3730" to-port="2" /> <edge from-layer="3730" from-port="3" to-layer="3754" to-port="0" /> <edge from-layer="3731" from-port="0" to-layer="3734" to-port="1" /> <edge from-layer="3732" from-port="0" to-layer="3734" to-port="2" /> <edge from-layer="3733" from-port="0" to-layer="3734" to-port="3" /> <edge from-layer="3734" from-port="5" to-layer="3736" to-port="0" /> <edge from-layer="3735" from-port="0" to-layer="3736" to-port="1" /> <edge from-layer="3736" from-port="2" to-layer="3738" to-port="0" /> <edge from-layer="3737" from-port="0" to-layer="3738" to-port="1" /> <edge from-layer="3738" from-port="2" to-layer="3750" to-port="0" /> <edge from-layer="3738" from-port="2" to-layer="3743" to-port="0" /> <edge from-layer="3738" from-port="2" to-layer="3739" to-port="0" /> <edge from-layer="3739" from-port="2" to-layer="3753" to-port="0" /> <edge from-layer="3740" from-port="0" to-layer="3743" to-port="1" /> <edge from-layer="3741" from-port="0" to-layer="3743" to-port="2" /> <edge from-layer="3742" from-port="0" to-layer="3743" to-port="3" /> <edge from-layer="3743" from-port="5" to-layer="3746" to-port="0" /> <edge from-layer="3744" from-port="0" to-layer="3745" to-port="0" /> <edge from-layer="3745" from-port="1" to-layer="3746" to-port="1" /> <edge from-layer="3746" from-port="2" to-layer="3751" to-port="0" /> <edge from-layer="3747" from-port="0" to-layer="3750" to-port="1" /> <edge from-layer="3748" from-port="0" to-layer="3750" to-port="2" /> <edge from-layer="3749" from-port="0" to-layer="3750" to-port="3" /> <edge from-layer="3750" from-port="5" to-layer="3751" to-port="1" /> <edge from-layer="3751" from-port="2" to-layer="3752" to-port="0" /> <edge from-layer="3752" from-port="2" to-layer="3753" to-port="1" /> <edge from-layer="3753" from-port="2" to-layer="3754" to-port="1" /> <edge from-layer="3754" from-port="2" to-layer="4270" to-port="0" /> <edge from-layer="3754" from-port="2" to-layer="3774" to-port="1" /> <edge from-layer="3755" from-port="0" to-layer="3756" to-port="0" /> <edge from-layer="3756" from-port="1" to-layer="3761" to-port="0" /> <edge from-layer="3757" from-port="0" to-layer="3760" to-port="1" /> <edge from-layer="3758" from-port="0" to-layer="3760" to-port="2" /> <edge from-layer="3759" from-port="0" to-layer="3760" to-port="3" /> <edge from-layer="3760" from-port="4" to-layer="3761" to-port="1" /> <edge from-layer="3761" from-port="2" to-layer="3762" to-port="0" /> <edge from-layer="3762" from-port="1" to-layer="3764" to-port="0" /> <edge from-layer="3763" from-port="0" to-layer="3764" to-port="2" /> <edge from-layer="3764" from-port="3" to-layer="3773" to-port="0" /> <edge from-layer="3765" from-port="0" to-layer="3768" to-port="1" /> <edge from-layer="3766" from-port="0" to-layer="3768" to-port="2" /> <edge from-layer="3767" from-port="0" to-layer="3768" to-port="3" /> <edge from-layer="3768" from-port="5" to-layer="3770" to-port="0" /> <edge from-layer="3769" from-port="0" to-layer="3770" to-port="1" /> <edge from-layer="3770" from-port="2" to-layer="3772" to-port="0" /> <edge from-layer="3771" from-port="0" to-layer="3772" to-port="1" /> <edge from-layer="3772" from-port="2" to-layer="3773" to-port="1" /> <edge from-layer="3773" from-port="2" to-layer="4269" to-port="0" /> <edge from-layer="3773" from-port="2" to-layer="3774" to-port="2" /> <edge from-layer="3774" from-port="4" to-layer="3776" to-port="0" /> <edge from-layer="3775" from-port="0" to-layer="3776" to-port="1" /> <edge from-layer="3776" from-port="2" to-layer="3778" to-port="0" /> <edge from-layer="3777" from-port="0" to-layer="3778" to-port="1" /> <edge from-layer="3778" from-port="2" to-layer="3781" to-port="0" /> <edge from-layer="3779" from-port="0" to-layer="3780" to-port="0" /> <edge from-layer="3780" from-port="1" to-layer="3781" to-port="1" /> <edge from-layer="3781" from-port="2" to-layer="3782" to-port="1" /> <edge from-layer="3782" from-port="2" to-layer="3797" to-port="0" /> <edge from-layer="3782" from-port="2" to-layer="3808" to-port="0" /> <edge from-layer="3782" from-port="2" to-layer="3789" to-port="0" /> <edge from-layer="3783" from-port="0" to-layer="3784" to-port="0" /> <edge from-layer="3784" from-port="1" to-layer="3798" to-port="0" /> <edge from-layer="3785" from-port="0" to-layer="3786" to-port="0" /> <edge from-layer="3786" from-port="1" to-layer="3796" to-port="0" /> <edge from-layer="3787" from-port="0" to-layer="3788" to-port="0" /> <edge from-layer="3788" from-port="1" to-layer="3789" to-port="1" /> <edge from-layer="3789" from-port="2" to-layer="3791" to-port="0" /> <edge from-layer="3790" from-port="0" to-layer="3791" to-port="1" /> <edge from-layer="3791" from-port="2" to-layer="3794" to-port="0" /> <edge from-layer="3792" from-port="0" to-layer="3793" to-port="0" /> <edge from-layer="3793" from-port="1" to-layer="3794" to-port="1" /> <edge from-layer="3794" from-port="2" to-layer="3795" to-port="0" /> <edge from-layer="3795" from-port="1" to-layer="3796" to-port="1" /> <edge from-layer="3796" from-port="2" to-layer="3797" to-port="1" /> <edge from-layer="3797" from-port="2" to-layer="3798" to-port="1" /> <edge from-layer="3798" from-port="2" to-layer="3801" to-port="0" /> <edge from-layer="3799" from-port="0" to-layer="3800" to-port="0" /> <edge from-layer="3800" from-port="1" to-layer="3801" to-port="1" /> <edge from-layer="3801" from-port="2" to-layer="3802" to-port="0" /> <edge from-layer="3802" from-port="3" to-layer="3803" to-port="0" /> <edge from-layer="3802" from-port="4" to-layer="3804" to-port="0" /> <edge from-layer="3803" from-port="1" to-layer="3804" to-port="1" /> <edge from-layer="3804" from-port="2" to-layer="3807" to-port="0" /> <edge from-layer="3805" from-port="0" to-layer="3806" to-port="0" /> <edge from-layer="3806" from-port="1" to-layer="3807" to-port="1" /> <edge from-layer="3807" from-port="2" to-layer="3808" to-port="1" /> <edge from-layer="3808" from-port="2" to-layer="3823" to-port="0" /> <edge from-layer="3808" from-port="2" to-layer="3912" to-port="0" /> <edge from-layer="3808" from-port="2" to-layer="3815" to-port="0" /> <edge from-layer="3809" from-port="0" to-layer="3810" to-port="0" /> <edge from-layer="3810" from-port="1" to-layer="3824" to-port="0" /> <edge from-layer="3811" from-port="0" to-layer="3812" to-port="0" /> <edge from-layer="3812" from-port="1" to-layer="3822" to-port="0" /> <edge from-layer="3813" from-port="0" to-layer="3814" to-port="0" /> <edge from-layer="3814" from-port="1" to-layer="3815" to-port="1" /> <edge from-layer="3815" from-port="2" to-layer="3817" to-port="0" /> <edge from-layer="3816" from-port="0" to-layer="3817" to-port="1" /> <edge from-layer="3817" from-port="2" to-layer="3820" to-port="0" /> <edge from-layer="3818" from-port="0" to-layer="3819" to-port="0" /> <edge from-layer="3819" from-port="1" to-layer="3820" to-port="1" /> <edge from-layer="3820" from-port="2" to-layer="3821" to-port="0" /> <edge from-layer="3821" from-port="1" to-layer="3822" to-port="1" /> <edge from-layer="3822" from-port="2" to-layer="3823" to-port="1" /> <edge from-layer="3823" from-port="2" to-layer="3824" to-port="1" /> <edge from-layer="3824" from-port="2" to-layer="3827" to-port="0" /> <edge from-layer="3825" from-port="0" to-layer="3826" to-port="0" /> <edge from-layer="3826" from-port="1" to-layer="3827" to-port="1" /> <edge from-layer="3827" from-port="2" to-layer="3864" to-port="0" /> <edge from-layer="3827" from-port="2" to-layer="3898" to-port="0" /> <edge from-layer="3827" from-port="2" to-layer="3831" to-port="0" /> <edge from-layer="3828" from-port="0" to-layer="3831" to-port="1" /> <edge from-layer="3829" from-port="0" to-layer="3831" to-port="2" /> <edge from-layer="3830" from-port="0" to-layer="3831" to-port="3" /> <edge from-layer="3831" from-port="5" to-layer="3833" to-port="0" /> <edge from-layer="3832" from-port="0" to-layer="3833" to-port="1" /> <edge from-layer="3833" from-port="2" to-layer="3835" to-port="0" /> <edge from-layer="3834" from-port="0" to-layer="3835" to-port="1" /> <edge from-layer="3835" from-port="2" to-layer="3836" to-port="0" /> <edge from-layer="3835" from-port="2" to-layer="3840" to-port="0" /> <edge from-layer="3835" from-port="2" to-layer="3847" to-port="0" /> <edge from-layer="3836" from-port="2" to-layer="3850" to-port="0" /> <edge from-layer="3837" from-port="0" to-layer="3840" to-port="1" /> <edge from-layer="3838" from-port="0" to-layer="3840" to-port="2" /> <edge from-layer="3839" from-port="0" to-layer="3840" to-port="3" /> <edge from-layer="3840" from-port="5" to-layer="3843" to-port="0" /> <edge from-layer="3841" from-port="0" to-layer="3842" to-port="0" /> <edge from-layer="3842" from-port="1" to-layer="3843" to-port="1" /> <edge from-layer="3843" from-port="2" to-layer="3848" to-port="0" /> <edge from-layer="3844" from-port="0" to-layer="3847" to-port="1" /> <edge from-layer="3845" from-port="0" to-layer="3847" to-port="2" /> <edge from-layer="3846" from-port="0" to-layer="3847" to-port="3" /> <edge from-layer="3847" from-port="5" to-layer="3848" to-port="1" /> <edge from-layer="3848" from-port="2" to-layer="3849" to-port="0" /> <edge from-layer="3849" from-port="2" to-layer="3850" to-port="1" /> <edge from-layer="3850" from-port="2" to-layer="3904" to-port="0" /> <edge from-layer="3851" from-port="0" to-layer="3852" to-port="0" /> <edge from-layer="3852" from-port="1" to-layer="3857" to-port="0" /> <edge from-layer="3853" from-port="0" to-layer="3856" to-port="1" /> <edge from-layer="3854" from-port="0" to-layer="3856" to-port="2" /> <edge from-layer="3855" from-port="0" to-layer="3856" to-port="3" /> <edge from-layer="3856" from-port="4" to-layer="3857" to-port="1" /> <edge from-layer="3857" from-port="2" to-layer="3858" to-port="0" /> <edge from-layer="3858" from-port="1" to-layer="3860" to-port="0" /> <edge from-layer="3859" from-port="0" to-layer="3860" to-port="2" /> <edge from-layer="3860" from-port="3" to-layer="3884" to-port="0" /> <edge from-layer="3861" from-port="0" to-layer="3864" to-port="1" /> <edge from-layer="3862" from-port="0" to-layer="3864" to-port="2" /> <edge from-layer="3863" from-port="0" to-layer="3864" to-port="3" /> <edge from-layer="3864" from-port="5" to-layer="3866" to-port="0" /> <edge from-layer="3865" from-port="0" to-layer="3866" to-port="1" /> <edge from-layer="3866" from-port="2" to-layer="3868" to-port="0" /> <edge from-layer="3867" from-port="0" to-layer="3868" to-port="1" /> <edge from-layer="3868" from-port="2" to-layer="3869" to-port="0" /> <edge from-layer="3868" from-port="2" to-layer="3873" to-port="0" /> <edge from-layer="3868" from-port="2" to-layer="3880" to-port="0" /> <edge from-layer="3869" from-port="2" to-layer="3883" to-port="0" /> <edge from-layer="3870" from-port="0" to-layer="3873" to-port="1" /> <edge from-layer="3871" from-port="0" to-layer="3873" to-port="2" /> <edge from-layer="3872" from-port="0" to-layer="3873" to-port="3" /> <edge from-layer="3873" from-port="5" to-layer="3876" to-port="0" /> <edge from-layer="3874" from-port="0" to-layer="3875" to-port="0" /> <edge from-layer="3875" from-port="1" to-layer="3876" to-port="1" /> <edge from-layer="3876" from-port="2" to-layer="3881" to-port="0" /> <edge from-layer="3877" from-port="0" to-layer="3880" to-port="1" /> <edge from-layer="3878" from-port="0" to-layer="3880" to-port="2" /> <edge from-layer="3879" from-port="0" to-layer="3880" to-port="3" /> <edge from-layer="3880" from-port="5" to-layer="3881" to-port="1" /> <edge from-layer="3881" from-port="2" to-layer="3882" to-port="0" /> <edge from-layer="3882" from-port="2" to-layer="3883" to-port="1" /> <edge from-layer="3883" from-port="2" to-layer="3884" to-port="1" /> <edge from-layer="3884" from-port="2" to-layer="4268" to-port="0" /> <edge from-layer="3884" from-port="2" to-layer="3904" to-port="1" /> <edge from-layer="3885" from-port="0" to-layer="3886" to-port="0" /> <edge from-layer="3886" from-port="1" to-layer="3891" to-port="0" /> <edge from-layer="3887" from-port="0" to-layer="3890" to-port="1" /> <edge from-layer="3888" from-port="0" to-layer="3890" to-port="2" /> <edge from-layer="3889" from-port="0" to-layer="3890" to-port="3" /> <edge from-layer="3890" from-port="4" to-layer="3891" to-port="1" /> <edge from-layer="3891" from-port="2" to-layer="3892" to-port="0" /> <edge from-layer="3892" from-port="1" to-layer="3894" to-port="0" /> <edge from-layer="3893" from-port="0" to-layer="3894" to-port="2" /> <edge from-layer="3894" from-port="3" to-layer="3903" to-port="0" /> <edge from-layer="3895" from-port="0" to-layer="3898" to-port="1" /> <edge from-layer="3896" from-port="0" to-layer="3898" to-port="2" /> <edge from-layer="3897" from-port="0" to-layer="3898" to-port="3" /> <edge from-layer="3898" from-port="5" to-layer="3900" to-port="0" /> <edge from-layer="3899" from-port="0" to-layer="3900" to-port="1" /> <edge from-layer="3900" from-port="2" to-layer="3902" to-port="0" /> <edge from-layer="3901" from-port="0" to-layer="3902" to-port="1" /> <edge from-layer="3902" from-port="2" to-layer="3903" to-port="1" /> <edge from-layer="3903" from-port="2" to-layer="3904" to-port="2" /> <edge from-layer="3903" from-port="2" to-layer="4267" to-port="0" /> <edge from-layer="3904" from-port="4" to-layer="3906" to-port="0" /> <edge from-layer="3905" from-port="0" to-layer="3906" to-port="1" /> <edge from-layer="3906" from-port="2" to-layer="3908" to-port="0" /> <edge from-layer="3907" from-port="0" to-layer="3908" to-port="1" /> <edge from-layer="3908" from-port="2" to-layer="3911" to-port="0" /> <edge from-layer="3909" from-port="0" to-layer="3910" to-port="0" /> <edge from-layer="3910" from-port="1" to-layer="3911" to-port="1" /> <edge from-layer="3911" from-port="2" to-layer="3912" to-port="1" /> <edge from-layer="3912" from-port="2" to-layer="3919" to-port="0" /> <edge from-layer="3912" from-port="2" to-layer="3927" to-port="0" /> <edge from-layer="3912" from-port="2" to-layer="3938" to-port="0" /> <edge from-layer="3913" from-port="0" to-layer="3914" to-port="0" /> <edge from-layer="3914" from-port="1" to-layer="3928" to-port="0" /> <edge from-layer="3915" from-port="0" to-layer="3916" to-port="0" /> <edge from-layer="3916" from-port="1" to-layer="3926" to-port="0" /> <edge from-layer="3917" from-port="0" to-layer="3918" to-port="0" /> <edge from-layer="3918" from-port="1" to-layer="3919" to-port="1" /> <edge from-layer="3919" from-port="2" to-layer="3921" to-port="0" /> <edge from-layer="3920" from-port="0" to-layer="3921" to-port="1" /> <edge from-layer="3921" from-port="2" to-layer="3924" to-port="0" /> <edge from-layer="3922" from-port="0" to-layer="3923" to-port="0" /> <edge from-layer="3923" from-port="1" to-layer="3924" to-port="1" /> <edge from-layer="3924" from-port="2" to-layer="3925" to-port="0" /> <edge from-layer="3925" from-port="1" to-layer="3926" to-port="1" /> <edge from-layer="3926" from-port="2" to-layer="3927" to-port="1" /> <edge from-layer="3927" from-port="2" to-layer="3928" to-port="1" /> <edge from-layer="3928" from-port="2" to-layer="3931" to-port="0" /> <edge from-layer="3929" from-port="0" to-layer="3930" to-port="0" /> <edge from-layer="3930" from-port="1" to-layer="3931" to-port="1" /> <edge from-layer="3931" from-port="2" to-layer="3932" to-port="0" /> <edge from-layer="3932" from-port="3" to-layer="3933" to-port="0" /> <edge from-layer="3932" from-port="4" to-layer="3934" to-port="0" /> <edge from-layer="3933" from-port="1" to-layer="3934" to-port="1" /> <edge from-layer="3934" from-port="2" to-layer="3937" to-port="0" /> <edge from-layer="3935" from-port="0" to-layer="3936" to-port="0" /> <edge from-layer="3936" from-port="1" to-layer="3937" to-port="1" /> <edge from-layer="3937" from-port="2" to-layer="3938" to-port="1" /> <edge from-layer="3938" from-port="2" to-layer="3953" to-port="0" /> <edge from-layer="3938" from-port="2" to-layer="4042" to-port="0" /> <edge from-layer="3938" from-port="2" to-layer="3945" to-port="0" /> <edge from-layer="3939" from-port="0" to-layer="3940" to-port="0" /> <edge from-layer="3940" from-port="1" to-layer="3954" to-port="0" /> <edge from-layer="3941" from-port="0" to-layer="3942" to-port="0" /> <edge from-layer="3942" from-port="1" to-layer="3952" to-port="0" /> <edge from-layer="3943" from-port="0" to-layer="3944" to-port="0" /> <edge from-layer="3944" from-port="1" to-layer="3945" to-port="1" /> <edge from-layer="3945" from-port="2" to-layer="3947" to-port="0" /> <edge from-layer="3946" from-port="0" to-layer="3947" to-port="1" /> <edge from-layer="3947" from-port="2" to-layer="3950" to-port="0" /> <edge from-layer="3948" from-port="0" to-layer="3949" to-port="0" /> <edge from-layer="3949" from-port="1" to-layer="3950" to-port="1" /> <edge from-layer="3950" from-port="2" to-layer="3951" to-port="0" /> <edge from-layer="3951" from-port="1" to-layer="3952" to-port="1" /> <edge from-layer="3952" from-port="2" to-layer="3953" to-port="1" /> <edge from-layer="3953" from-port="2" to-layer="3954" to-port="1" /> <edge from-layer="3954" from-port="2" to-layer="3957" to-port="0" /> <edge from-layer="3955" from-port="0" to-layer="3956" to-port="0" /> <edge from-layer="3956" from-port="1" to-layer="3957" to-port="1" /> <edge from-layer="3957" from-port="2" to-layer="3961" to-port="0" /> <edge from-layer="3957" from-port="2" to-layer="4028" to-port="0" /> <edge from-layer="3957" from-port="2" to-layer="3994" to-port="0" /> <edge from-layer="3958" from-port="0" to-layer="3961" to-port="1" /> <edge from-layer="3959" from-port="0" to-layer="3961" to-port="2" /> <edge from-layer="3960" from-port="0" to-layer="3961" to-port="3" /> <edge from-layer="3961" from-port="5" to-layer="3963" to-port="0" /> <edge from-layer="3962" from-port="0" to-layer="3963" to-port="1" /> <edge from-layer="3963" from-port="2" to-layer="3965" to-port="0" /> <edge from-layer="3964" from-port="0" to-layer="3965" to-port="1" /> <edge from-layer="3965" from-port="2" to-layer="3977" to-port="0" /> <edge from-layer="3965" from-port="2" to-layer="3970" to-port="0" /> <edge from-layer="3965" from-port="2" to-layer="3966" to-port="0" /> <edge from-layer="3966" from-port="2" to-layer="3980" to-port="0" /> <edge from-layer="3967" from-port="0" to-layer="3970" to-port="1" /> <edge from-layer="3968" from-port="0" to-layer="3970" to-port="2" /> <edge from-layer="3969" from-port="0" to-layer="3970" to-port="3" /> <edge from-layer="3970" from-port="5" to-layer="3973" to-port="0" /> <edge from-layer="3971" from-port="0" to-layer="3972" to-port="0" /> <edge from-layer="3972" from-port="1" to-layer="3973" to-port="1" /> <edge from-layer="3973" from-port="2" to-layer="3978" to-port="0" /> <edge from-layer="3974" from-port="0" to-layer="3977" to-port="1" /> <edge from-layer="3975" from-port="0" to-layer="3977" to-port="2" /> <edge from-layer="3976" from-port="0" to-layer="3977" to-port="3" /> <edge from-layer="3977" from-port="5" to-layer="3978" to-port="1" /> <edge from-layer="3978" from-port="2" to-layer="3979" to-port="0" /> <edge from-layer="3979" from-port="2" to-layer="3980" to-port="1" /> <edge from-layer="3980" from-port="2" to-layer="4034" to-port="0" /> <edge from-layer="3981" from-port="0" to-layer="3982" to-port="0" /> <edge from-layer="3982" from-port="1" to-layer="3987" to-port="0" /> <edge from-layer="3983" from-port="0" to-layer="3986" to-port="1" /> <edge from-layer="3984" from-port="0" to-layer="3986" to-port="2" /> <edge from-layer="3985" from-port="0" to-layer="3986" to-port="3" /> <edge from-layer="3986" from-port="4" to-layer="3987" to-port="1" /> <edge from-layer="3987" from-port="2" to-layer="3988" to-port="0" /> <edge from-layer="3988" from-port="1" to-layer="3990" to-port="0" /> <edge from-layer="3989" from-port="0" to-layer="3990" to-port="2" /> <edge from-layer="3990" from-port="3" to-layer="4014" to-port="0" /> <edge from-layer="3991" from-port="0" to-layer="3994" to-port="1" /> <edge from-layer="3992" from-port="0" to-layer="3994" to-port="2" /> <edge from-layer="3993" from-port="0" to-layer="3994" to-port="3" /> <edge from-layer="3994" from-port="5" to-layer="3996" to-port="0" /> <edge from-layer="3995" from-port="0" to-layer="3996" to-port="1" /> <edge from-layer="3996" from-port="2" to-layer="3998" to-port="0" /> <edge from-layer="3997" from-port="0" to-layer="3998" to-port="1" /> <edge from-layer="3998" from-port="2" to-layer="3999" to-port="0" /> <edge from-layer="3998" from-port="2" to-layer="4003" to-port="0" /> <edge from-layer="3998" from-port="2" to-layer="4010" to-port="0" /> <edge from-layer="3999" from-port="2" to-layer="4013" to-port="0" /> <edge from-layer="4000" from-port="0" to-layer="4003" to-port="1" /> <edge from-layer="4001" from-port="0" to-layer="4003" to-port="2" /> <edge from-layer="4002" from-port="0" to-layer="4003" to-port="3" /> <edge from-layer="4003" from-port="5" to-layer="4006" to-port="0" /> <edge from-layer="4004" from-port="0" to-layer="4005" to-port="0" /> <edge from-layer="4005" from-port="1" to-layer="4006" to-port="1" /> <edge from-layer="4006" from-port="2" to-layer="4011" to-port="0" /> <edge from-layer="4007" from-port="0" to-layer="4010" to-port="1" /> <edge from-layer="4008" from-port="0" to-layer="4010" to-port="2" /> <edge from-layer="4009" from-port="0" to-layer="4010" to-port="3" /> <edge from-layer="4010" from-port="5" to-layer="4011" to-port="1" /> <edge from-layer="4011" from-port="2" to-layer="4012" to-port="0" /> <edge from-layer="4012" from-port="2" to-layer="4013" to-port="1" /> <edge from-layer="4013" from-port="2" to-layer="4014" to-port="1" /> <edge from-layer="4014" from-port="2" to-layer="4034" to-port="1" /> <edge from-layer="4014" from-port="2" to-layer="4266" to-port="0" /> <edge from-layer="4015" from-port="0" to-layer="4016" to-port="0" /> <edge from-layer="4016" from-port="1" to-layer="4021" to-port="0" /> <edge from-layer="4017" from-port="0" to-layer="4020" to-port="1" /> <edge from-layer="4018" from-port="0" to-layer="4020" to-port="2" /> <edge from-layer="4019" from-port="0" to-layer="4020" to-port="3" /> <edge from-layer="4020" from-port="4" to-layer="4021" to-port="1" /> <edge from-layer="4021" from-port="2" to-layer="4022" to-port="0" /> <edge from-layer="4022" from-port="1" to-layer="4024" to-port="0" /> <edge from-layer="4023" from-port="0" to-layer="4024" to-port="2" /> <edge from-layer="4024" from-port="3" to-layer="4033" to-port="0" /> <edge from-layer="4025" from-port="0" to-layer="4028" to-port="1" /> <edge from-layer="4026" from-port="0" to-layer="4028" to-port="2" /> <edge from-layer="4027" from-port="0" to-layer="4028" to-port="3" /> <edge from-layer="4028" from-port="5" to-layer="4030" to-port="0" /> <edge from-layer="4029" from-port="0" to-layer="4030" to-port="1" /> <edge from-layer="4030" from-port="2" to-layer="4032" to-port="0" /> <edge from-layer="4031" from-port="0" to-layer="4032" to-port="1" /> <edge from-layer="4032" from-port="2" to-layer="4033" to-port="1" /> <edge from-layer="4033" from-port="2" to-layer="4034" to-port="2" /> <edge from-layer="4033" from-port="2" to-layer="4265" to-port="0" /> <edge from-layer="4034" from-port="4" to-layer="4036" to-port="0" /> <edge from-layer="4035" from-port="0" to-layer="4036" to-port="1" /> <edge from-layer="4036" from-port="2" to-layer="4038" to-port="0" /> <edge from-layer="4037" from-port="0" to-layer="4038" to-port="1" /> <edge from-layer="4038" from-port="2" to-layer="4041" to-port="0" /> <edge from-layer="4039" from-port="0" to-layer="4040" to-port="0" /> <edge from-layer="4040" from-port="1" to-layer="4041" to-port="1" /> <edge from-layer="4041" from-port="2" to-layer="4042" to-port="1" /> <edge from-layer="4042" from-port="2" to-layer="4049" to-port="0" /> <edge from-layer="4042" from-port="2" to-layer="4068" to-port="0" /> <edge from-layer="4042" from-port="2" to-layer="4057" to-port="0" /> <edge from-layer="4043" from-port="0" to-layer="4044" to-port="0" /> <edge from-layer="4044" from-port="1" to-layer="4058" to-port="0" /> <edge from-layer="4045" from-port="0" to-layer="4046" to-port="0" /> <edge from-layer="4046" from-port="1" to-layer="4056" to-port="0" /> <edge from-layer="4047" from-port="0" to-layer="4048" to-port="0" /> <edge from-layer="4048" from-port="1" to-layer="4049" to-port="1" /> <edge from-layer="4049" from-port="2" to-layer="4051" to-port="0" /> <edge from-layer="4050" from-port="0" to-layer="4051" to-port="1" /> <edge from-layer="4051" from-port="2" to-layer="4054" to-port="0" /> <edge from-layer="4052" from-port="0" to-layer="4053" to-port="0" /> <edge from-layer="4053" from-port="1" to-layer="4054" to-port="1" /> <edge from-layer="4054" from-port="2" to-layer="4055" to-port="0" /> <edge from-layer="4055" from-port="1" to-layer="4056" to-port="1" /> <edge from-layer="4056" from-port="2" to-layer="4057" to-port="1" /> <edge from-layer="4057" from-port="2" to-layer="4058" to-port="1" /> <edge from-layer="4058" from-port="2" to-layer="4061" to-port="0" /> <edge from-layer="4059" from-port="0" to-layer="4060" to-port="0" /> <edge from-layer="4060" from-port="1" to-layer="4061" to-port="1" /> <edge from-layer="4061" from-port="2" to-layer="4062" to-port="0" /> <edge from-layer="4062" from-port="3" to-layer="4063" to-port="0" /> <edge from-layer="4062" from-port="4" to-layer="4064" to-port="0" /> <edge from-layer="4063" from-port="1" to-layer="4064" to-port="1" /> <edge from-layer="4064" from-port="2" to-layer="4067" to-port="0" /> <edge from-layer="4065" from-port="0" to-layer="4066" to-port="0" /> <edge from-layer="4066" from-port="1" to-layer="4067" to-port="1" /> <edge from-layer="4067" from-port="2" to-layer="4068" to-port="1" /> <edge from-layer="4068" from-port="2" to-layer="4075" to-port="0" /> <edge from-layer="4068" from-port="2" to-layer="4083" to-port="0" /> <edge from-layer="4068" from-port="2" to-layer="4172" to-port="0" /> <edge from-layer="4069" from-port="0" to-layer="4070" to-port="0" /> <edge from-layer="4070" from-port="1" to-layer="4084" to-port="0" /> <edge from-layer="4071" from-port="0" to-layer="4072" to-port="0" /> <edge from-layer="4072" from-port="1" to-layer="4082" to-port="0" /> <edge from-layer="4073" from-port="0" to-layer="4074" to-port="0" /> <edge from-layer="4074" from-port="1" to-layer="4075" to-port="1" /> <edge from-layer="4075" from-port="2" to-layer="4077" to-port="0" /> <edge from-layer="4076" from-port="0" to-layer="4077" to-port="1" /> <edge from-layer="4077" from-port="2" to-layer="4080" to-port="0" /> <edge from-layer="4078" from-port="0" to-layer="4079" to-port="0" /> <edge from-layer="4079" from-port="1" to-layer="4080" to-port="1" /> <edge from-layer="4080" from-port="2" to-layer="4081" to-port="0" /> <edge from-layer="4081" from-port="1" to-layer="4082" to-port="1" /> <edge from-layer="4082" from-port="2" to-layer="4083" to-port="1" /> <edge from-layer="4083" from-port="2" to-layer="4084" to-port="1" /> <edge from-layer="4084" from-port="2" to-layer="4087" to-port="0" /> <edge from-layer="4085" from-port="0" to-layer="4086" to-port="0" /> <edge from-layer="4086" from-port="1" to-layer="4087" to-port="1" /> <edge from-layer="4087" from-port="2" to-layer="4158" to-port="0" /> <edge from-layer="4087" from-port="2" to-layer="4091" to-port="0" /> <edge from-layer="4087" from-port="2" to-layer="4124" to-port="0" /> <edge from-layer="4088" from-port="0" to-layer="4091" to-port="1" /> <edge from-layer="4089" from-port="0" to-layer="4091" to-port="2" /> <edge from-layer="4090" from-port="0" to-layer="4091" to-port="3" /> <edge from-layer="4091" from-port="5" to-layer="4093" to-port="0" /> <edge from-layer="4092" from-port="0" to-layer="4093" to-port="1" /> <edge from-layer="4093" from-port="2" to-layer="4095" to-port="0" /> <edge from-layer="4094" from-port="0" to-layer="4095" to-port="1" /> <edge from-layer="4095" from-port="2" to-layer="4100" to-port="0" /> <edge from-layer="4095" from-port="2" to-layer="4096" to-port="0" /> <edge from-layer="4095" from-port="2" to-layer="4107" to-port="0" /> <edge from-layer="4096" from-port="2" to-layer="4110" to-port="0" /> <edge from-layer="4097" from-port="0" to-layer="4100" to-port="1" /> <edge from-layer="4098" from-port="0" to-layer="4100" to-port="2" /> <edge from-layer="4099" from-port="0" to-layer="4100" to-port="3" /> <edge from-layer="4100" from-port="5" to-layer="4103" to-port="0" /> <edge from-layer="4101" from-port="0" to-layer="4102" to-port="0" /> <edge from-layer="4102" from-port="1" to-layer="4103" to-port="1" /> <edge from-layer="4103" from-port="2" to-layer="4108" to-port="0" /> <edge from-layer="4104" from-port="0" to-layer="4107" to-port="1" /> <edge from-layer="4105" from-port="0" to-layer="4107" to-port="2" /> <edge from-layer="4106" from-port="0" to-layer="4107" to-port="3" /> <edge from-layer="4107" from-port="5" to-layer="4108" to-port="1" /> <edge from-layer="4108" from-port="2" to-layer="4109" to-port="0" /> <edge from-layer="4109" from-port="2" to-layer="4110" to-port="1" /> <edge from-layer="4110" from-port="2" to-layer="4164" to-port="0" /> <edge from-layer="4111" from-port="0" to-layer="4112" to-port="0" /> <edge from-layer="4112" from-port="1" to-layer="4117" to-port="0" /> <edge from-layer="4113" from-port="0" to-layer="4116" to-port="1" /> <edge from-layer="4114" from-port="0" to-layer="4116" to-port="2" /> <edge from-layer="4115" from-port="0" to-layer="4116" to-port="3" /> <edge from-layer="4116" from-port="4" to-layer="4117" to-port="1" /> <edge from-layer="4117" from-port="2" to-layer="4118" to-port="0" /> <edge from-layer="4118" from-port="1" to-layer="4120" to-port="0" /> <edge from-layer="4119" from-port="0" to-layer="4120" to-port="2" /> <edge from-layer="4120" from-port="3" to-layer="4144" to-port="0" /> <edge from-layer="4121" from-port="0" to-layer="4124" to-port="1" /> <edge from-layer="4122" from-port="0" to-layer="4124" to-port="2" /> <edge from-layer="4123" from-port="0" to-layer="4124" to-port="3" /> <edge from-layer="4124" from-port="5" to-layer="4126" to-port="0" /> <edge from-layer="4125" from-port="0" to-layer="4126" to-port="1" /> <edge from-layer="4126" from-port="2" to-layer="4128" to-port="0" /> <edge from-layer="4127" from-port="0" to-layer="4128" to-port="1" /> <edge from-layer="4128" from-port="2" to-layer="4140" to-port="0" /> <edge from-layer="4128" from-port="2" to-layer="4133" to-port="0" /> <edge from-layer="4128" from-port="2" to-layer="4129" to-port="0" /> <edge from-layer="4129" from-port="2" to-layer="4143" to-port="0" /> <edge from-layer="4130" from-port="0" to-layer="4133" to-port="1" /> <edge from-layer="4131" from-port="0" to-layer="4133" to-port="2" /> <edge from-layer="4132" from-port="0" to-layer="4133" to-port="3" /> <edge from-layer="4133" from-port="5" to-layer="4136" to-port="0" /> <edge from-layer="4134" from-port="0" to-layer="4135" to-port="0" /> <edge from-layer="4135" from-port="1" to-layer="4136" to-port="1" /> <edge from-layer="4136" from-port="2" to-layer="4141" to-port="0" /> <edge from-layer="4137" from-port="0" to-layer="4140" to-port="1" /> <edge from-layer="4138" from-port="0" to-layer="4140" to-port="2" /> <edge from-layer="4139" from-port="0" to-layer="4140" to-port="3" /> <edge from-layer="4140" from-port="5" to-layer="4141" to-port="1" /> <edge from-layer="4141" from-port="2" to-layer="4142" to-port="0" /> <edge from-layer="4142" from-port="2" to-layer="4143" to-port="1" /> <edge from-layer="4143" from-port="2" to-layer="4144" to-port="1" /> <edge from-layer="4144" from-port="2" to-layer="4262" to-port="0" /> <edge from-layer="4144" from-port="2" to-layer="4164" to-port="1" /> <edge from-layer="4145" from-port="0" to-layer="4146" to-port="0" /> <edge from-layer="4146" from-port="1" to-layer="4151" to-port="0" /> <edge from-layer="4147" from-port="0" to-layer="4150" to-port="1" /> <edge from-layer="4148" from-port="0" to-layer="4150" to-port="2" /> <edge from-layer="4149" from-port="0" to-layer="4150" to-port="3" /> <edge from-layer="4150" from-port="4" to-layer="4151" to-port="1" /> <edge from-layer="4151" from-port="2" to-layer="4152" to-port="0" /> <edge from-layer="4152" from-port="1" to-layer="4154" to-port="0" /> <edge from-layer="4153" from-port="0" to-layer="4154" to-port="2" /> <edge from-layer="4154" from-port="3" to-layer="4163" to-port="0" /> <edge from-layer="4155" from-port="0" to-layer="4158" to-port="1" /> <edge from-layer="4156" from-port="0" to-layer="4158" to-port="2" /> <edge from-layer="4157" from-port="0" to-layer="4158" to-port="3" /> <edge from-layer="4158" from-port="5" to-layer="4160" to-port="0" /> <edge from-layer="4159" from-port="0" to-layer="4160" to-port="1" /> <edge from-layer="4160" from-port="2" to-layer="4162" to-port="0" /> <edge from-layer="4161" from-port="0" to-layer="4162" to-port="1" /> <edge from-layer="4162" from-port="2" to-layer="4163" to-port="1" /> <edge from-layer="4163" from-port="2" to-layer="4164" to-port="2" /> <edge from-layer="4163" from-port="2" to-layer="4261" to-port="0" /> <edge from-layer="4164" from-port="4" to-layer="4166" to-port="0" /> <edge from-layer="4165" from-port="0" to-layer="4166" to-port="1" /> <edge from-layer="4166" from-port="2" to-layer="4168" to-port="0" /> <edge from-layer="4167" from-port="0" to-layer="4168" to-port="1" /> <edge from-layer="4168" from-port="2" to-layer="4171" to-port="0" /> <edge from-layer="4169" from-port="0" to-layer="4170" to-port="0" /> <edge from-layer="4170" from-port="1" to-layer="4171" to-port="1" /> <edge from-layer="4171" from-port="2" to-layer="4172" to-port="1" /> <edge from-layer="4172" from-port="2" to-layer="4187" to-port="0" /> <edge from-layer="4172" from-port="2" to-layer="4179" to-port="0" /> <edge from-layer="4172" from-port="2" to-layer="4198" to-port="0" /> <edge from-layer="4173" from-port="0" to-layer="4174" to-port="0" /> <edge from-layer="4174" from-port="1" to-layer="4188" to-port="0" /> <edge from-layer="4175" from-port="0" to-layer="4176" to-port="0" /> <edge from-layer="4176" from-port="1" to-layer="4186" to-port="0" /> <edge from-layer="4177" from-port="0" to-layer="4178" to-port="0" /> <edge from-layer="4178" from-port="1" to-layer="4179" to-port="1" /> <edge from-layer="4179" from-port="2" to-layer="4181" to-port="0" /> <edge from-layer="4180" from-port="0" to-layer="4181" to-port="1" /> <edge from-layer="4181" from-port="2" to-layer="4184" to-port="0" /> <edge from-layer="4182" from-port="0" to-layer="4183" to-port="0" /> <edge from-layer="4183" from-port="1" to-layer="4184" to-port="1" /> <edge from-layer="4184" from-port="2" to-layer="4185" to-port="0" /> <edge from-layer="4185" from-port="1" to-layer="4186" to-port="1" /> <edge from-layer="4186" from-port="2" to-layer="4187" to-port="1" /> <edge from-layer="4187" from-port="2" to-layer="4188" to-port="1" /> <edge from-layer="4188" from-port="2" to-layer="4191" to-port="0" /> <edge from-layer="4189" from-port="0" to-layer="4190" to-port="0" /> <edge from-layer="4190" from-port="1" to-layer="4191" to-port="1" /> <edge from-layer="4191" from-port="2" to-layer="4192" to-port="0" /> <edge from-layer="4192" from-port="4" to-layer="4194" to-port="0" /> <edge from-layer="4192" from-port="3" to-layer="4193" to-port="0" /> <edge from-layer="4193" from-port="1" to-layer="4194" to-port="1" /> <edge from-layer="4194" from-port="2" to-layer="4197" to-port="0" /> <edge from-layer="4195" from-port="0" to-layer="4196" to-port="0" /> <edge from-layer="4196" from-port="1" to-layer="4197" to-port="1" /> <edge from-layer="4197" from-port="2" to-layer="4198" to-port="1" /> <edge from-layer="4198" from-port="2" to-layer="4211" to-port="0" /> <edge from-layer="4198" from-port="2" to-layer="4344" to-port="0" /> <edge from-layer="4198" from-port="2" to-layer="4203" to-port="0" /> <edge from-layer="4199" from-port="0" to-layer="4200" to-port="0" /> <edge from-layer="4200" from-port="1" to-layer="4210" to-port="0" /> <edge from-layer="4201" from-port="0" to-layer="4202" to-port="0" /> <edge from-layer="4202" from-port="1" to-layer="4203" to-port="1" /> <edge from-layer="4203" from-port="2" to-layer="4205" to-port="0" /> <edge from-layer="4204" from-port="0" to-layer="4205" to-port="1" /> <edge from-layer="4205" from-port="2" to-layer="4208" to-port="0" /> <edge from-layer="4206" from-port="0" to-layer="4207" to-port="0" /> <edge from-layer="4207" from-port="1" to-layer="4208" to-port="1" /> <edge from-layer="4208" from-port="2" to-layer="4209" to-port="0" /> <edge from-layer="4209" from-port="1" to-layer="4210" to-port="1" /> <edge from-layer="4210" from-port="2" to-layer="4211" to-port="1" /> <edge from-layer="4211" from-port="2" to-layer="4212" to-port="1" /> <edge from-layer="4212" from-port="2" to-layer="4215" to-port="0" /> <edge from-layer="4213" from-port="0" to-layer="4214" to-port="0" /> <edge from-layer="4214" from-port="1" to-layer="4215" to-port="1" /> <edge from-layer="4215" from-port="2" to-layer="4316" to-port="0" /> <edge from-layer="4215" from-port="2" to-layer="4219" to-port="0" /> <edge from-layer="4215" from-port="2" to-layer="4239" to-port="0" /> <edge from-layer="4216" from-port="0" to-layer="4219" to-port="1" /> <edge from-layer="4217" from-port="0" to-layer="4219" to-port="2" /> <edge from-layer="4218" from-port="0" to-layer="4219" to-port="3" /> <edge from-layer="4219" from-port="5" to-layer="4221" to-port="0" /> <edge from-layer="4220" from-port="0" to-layer="4221" to-port="1" /> <edge from-layer="4221" from-port="2" to-layer="4223" to-port="0" /> <edge from-layer="4222" from-port="0" to-layer="4223" to-port="1" /> <edge from-layer="4223" from-port="2" to-layer="4224" to-port="1" /> <edge from-layer="4224" from-port="2" to-layer="4336" to-port="2" /> <edge from-layer="4224" from-port="2" to-layer="4225" to-port="0" /> <edge from-layer="4226" from-port="0" to-layer="4227" to-port="0" /> <edge from-layer="4227" from-port="1" to-layer="4232" to-port="0" /> <edge from-layer="4228" from-port="0" to-layer="4231" to-port="1" /> <edge from-layer="4229" from-port="0" to-layer="4231" to-port="2" /> <edge from-layer="4230" from-port="0" to-layer="4231" to-port="3" /> <edge from-layer="4231" from-port="4" to-layer="4232" to-port="1" /> <edge from-layer="4232" from-port="2" to-layer="4233" to-port="0" /> <edge from-layer="4233" from-port="1" to-layer="4235" to-port="0" /> <edge from-layer="4234" from-port="0" to-layer="4235" to-port="2" /> <edge from-layer="4235" from-port="3" to-layer="4259" to-port="0" /> <edge from-layer="4236" from-port="0" to-layer="4239" to-port="1" /> <edge from-layer="4237" from-port="0" to-layer="4239" to-port="2" /> <edge from-layer="4238" from-port="0" to-layer="4239" to-port="3" /> <edge from-layer="4239" from-port="5" to-layer="4241" to-port="0" /> <edge from-layer="4240" from-port="0" to-layer="4241" to-port="1" /> <edge from-layer="4241" from-port="2" to-layer="4243" to-port="0" /> <edge from-layer="4242" from-port="0" to-layer="4243" to-port="1" /> <edge from-layer="4243" from-port="2" to-layer="4248" to-port="0" /> <edge from-layer="4243" from-port="2" to-layer="4255" to-port="0" /> <edge from-layer="4243" from-port="2" to-layer="4244" to-port="0" /> <edge from-layer="4244" from-port="2" to-layer="4258" to-port="0" /> <edge from-layer="4245" from-port="0" to-layer="4248" to-port="1" /> <edge from-layer="4246" from-port="0" to-layer="4248" to-port="2" /> <edge from-layer="4247" from-port="0" to-layer="4248" to-port="3" /> <edge from-layer="4248" from-port="5" to-layer="4251" to-port="0" /> <edge from-layer="4249" from-port="0" to-layer="4250" to-port="0" /> <edge from-layer="4250" from-port="1" to-layer="4251" to-port="1" /> <edge from-layer="4251" from-port="2" to-layer="4256" to-port="0" /> <edge from-layer="4252" from-port="0" to-layer="4255" to-port="1" /> <edge from-layer="4253" from-port="0" to-layer="4255" to-port="2" /> <edge from-layer="4254" from-port="0" to-layer="4255" to-port="3" /> <edge from-layer="4255" from-port="5" to-layer="4256" to-port="1" /> <edge from-layer="4256" from-port="2" to-layer="4257" to-port="0" /> <edge from-layer="4257" from-port="2" to-layer="4258" to-port="1" /> <edge from-layer="4258" from-port="2" to-layer="4259" to-port="1" /> <edge from-layer="4259" from-port="2" to-layer="4336" to-port="1" /> <edge from-layer="4259" from-port="2" to-layer="4260" to-port="0" /> <edge from-layer="4311" from-port="0" to-layer="4312" to-port="0" /> <edge from-layer="4312" from-port="1" to-layer="4384" to-port="0" /> <edge from-layer="4313" from-port="0" to-layer="4316" to-port="1" /> <edge from-layer="4314" from-port="0" to-layer="4316" to-port="2" /> <edge from-layer="4315" from-port="0" to-layer="4316" to-port="3" /> <edge from-layer="4316" from-port="5" to-layer="4318" to-port="0" /> <edge from-layer="4317" from-port="0" to-layer="4318" to-port="1" /> <edge from-layer="4318" from-port="2" to-layer="4320" to-port="0" /> <edge from-layer="4319" from-port="0" to-layer="4320" to-port="1" /> <edge from-layer="4320" from-port="2" to-layer="4321" to-port="0" /> <edge from-layer="4320" from-port="2" to-layer="4325" to-port="0" /> <edge from-layer="4320" from-port="2" to-layer="4332" to-port="0" /> <edge from-layer="4321" from-port="2" to-layer="4335" to-port="0" /> <edge from-layer="4322" from-port="0" to-layer="4325" to-port="1" /> <edge from-layer="4323" from-port="0" to-layer="4325" to-port="2" /> <edge from-layer="4324" from-port="0" to-layer="4325" to-port="3" /> <edge from-layer="4325" from-port="5" to-layer="4328" to-port="0" /> <edge from-layer="4326" from-port="0" to-layer="4327" to-port="0" /> <edge from-layer="4327" from-port="1" to-layer="4328" to-port="1" /> <edge from-layer="4328" from-port="2" to-layer="4333" to-port="0" /> <edge from-layer="4329" from-port="0" to-layer="4332" to-port="1" /> <edge from-layer="4330" from-port="0" to-layer="4332" to-port="2" /> <edge from-layer="4331" from-port="0" to-layer="4332" to-port="3" /> <edge from-layer="4332" from-port="5" to-layer="4333" to-port="1" /> <edge from-layer="4333" from-port="2" to-layer="4334" to-port="0" /> <edge from-layer="4334" from-port="2" to-layer="4335" to-port="1" /> <edge from-layer="4335" from-port="2" to-layer="4336" to-port="0" /> <edge from-layer="4336" from-port="4" to-layer="4338" to-port="0" /> <edge from-layer="4337" from-port="0" to-layer="4338" to-port="1" /> <edge from-layer="4338" from-port="2" to-layer="4340" to-port="0" /> <edge from-layer="4339" from-port="0" to-layer="4340" to-port="1" /> <edge from-layer="4340" from-port="2" to-layer="4343" to-port="0" /> <edge from-layer="4341" from-port="0" to-layer="4342" to-port="0" /> <edge from-layer="4342" from-port="1" to-layer="4343" to-port="1" /> <edge from-layer="4343" from-port="2" to-layer="4344" to-port="1" /> <edge from-layer="4344" from-port="2" to-layer="4359" to-port="0" /> <edge from-layer="4344" from-port="2" to-layer="4370" to-port="0" /> <edge from-layer="4344" from-port="2" to-layer="4351" to-port="0" /> <edge from-layer="4345" from-port="0" to-layer="4346" to-port="0" /> <edge from-layer="4346" from-port="1" to-layer="4360" to-port="0" /> <edge from-layer="4347" from-port="0" to-layer="4348" to-port="0" /> <edge from-layer="4348" from-port="1" to-layer="4358" to-port="0" /> <edge from-layer="4349" from-port="0" to-layer="4350" to-port="0" /> <edge from-layer="4350" from-port="1" to-layer="4351" to-port="1" /> <edge from-layer="4351" from-port="2" to-layer="4353" to-port="0" /> <edge from-layer="4352" from-port="0" to-layer="4353" to-port="1" /> <edge from-layer="4353" from-port="2" to-layer="4356" to-port="0" /> <edge from-layer="4354" from-port="0" to-layer="4355" to-port="0" /> <edge from-layer="4355" from-port="1" to-layer="4356" to-port="1" /> <edge from-layer="4356" from-port="2" to-layer="4357" to-port="0" /> <edge from-layer="4357" from-port="1" to-layer="4358" to-port="1" /> <edge from-layer="4358" from-port="2" to-layer="4359" to-port="1" /> <edge from-layer="4359" from-port="2" to-layer="4360" to-port="1" /> <edge from-layer="4360" from-port="2" to-layer="4363" to-port="0" /> <edge from-layer="4361" from-port="0" to-layer="4362" to-port="0" /> <edge from-layer="4362" from-port="1" to-layer="4363" to-port="1" /> <edge from-layer="4363" from-port="2" to-layer="4364" to-port="0" /> <edge from-layer="4364" from-port="3" to-layer="4365" to-port="0" /> <edge from-layer="4364" from-port="4" to-layer="4366" to-port="0" /> <edge from-layer="4365" from-port="1" to-layer="4366" to-port="1" /> <edge from-layer="4366" from-port="2" to-layer="4369" to-port="0" /> <edge from-layer="4367" from-port="0" to-layer="4368" to-port="0" /> <edge from-layer="4368" from-port="1" to-layer="4369" to-port="1" /> <edge from-layer="4369" from-port="2" to-layer="4370" to-port="1" /> <edge from-layer="4370" from-port="2" to-layer="4375" to-port="0" /> <edge from-layer="4370" from-port="2" to-layer="4383" to-port="0" /> <edge from-layer="4371" from-port="0" to-layer="4372" to-port="0" /> <edge from-layer="4372" from-port="1" to-layer="4382" to-port="0" /> <edge from-layer="4373" from-port="0" to-layer="4374" to-port="0" /> <edge from-layer="4374" from-port="1" to-layer="4375" to-port="1" /> <edge from-layer="4375" from-port="2" to-layer="4377" to-port="0" /> <edge from-layer="4376" from-port="0" to-layer="4377" to-port="1" /> <edge from-layer="4377" from-port="2" to-layer="4380" to-port="0" /> <edge from-layer="4378" from-port="0" to-layer="4379" to-port="0" /> <edge from-layer="4379" from-port="1" to-layer="4380" to-port="1" /> <edge from-layer="4380" from-port="2" to-layer="4381" to-port="0" /> <edge from-layer="4381" from-port="1" to-layer="4382" to-port="1" /> <edge from-layer="4382" from-port="2" to-layer="4383" to-port="1" /> <edge from-layer="4383" from-port="2" to-layer="4384" to-port="1" /> <edge from-layer="4384" from-port="2" to-layer="4387" to-port="0" /> <edge from-layer="4385" from-port="0" to-layer="4386" to-port="0" /> <edge from-layer="4386" from-port="1" to-layer="4387" to-port="1" /> <edge from-layer="4387" from-port="2" to-layer="4388" to-port="0" /> </edges> <rt_info> <Runtime_version value="2025.0.0-17933-815af98acd8-releases/2025/0" /> <conversion_parameters> <framework value="pytorch" /> <is_python_object value="True" /> </conversion_parameters> <optimum> <optimum_intel_version value="1.22.0.dev0+753f84d" /> <optimum_version value="1.24.0.dev0" /> <pytorch_version value="2.5.0+cpu" /> <transformers_version value="4.45.0" /> </optimum> <runtime_options> <ACTIVATIONS_SCALE_FACTOR value="8.0" /> <KV_CACHE_PRECISION value="f16" /> </runtime_options> </rt_info> </net>