pytorch2.9.1:L o/rotary/Constant_output_0/rotary/Constant"Constant*6 value**B/rotary/Constant_attr::valueJ D position_ids/rotary/Cast_output_0 /rotary/Cast"Cast* to /rotary/Constant_1_output_0/rotary/Constant_1"Constant*B value*6B/rotary/Constant_1_attr::valueJ z /rotary/Cast_output_0 /rotary/Constant_1_output_0/rotary/Reshape_output_0/rotary/Reshape"Reshape* allowzero /rotary/Constant_2_output_0/rotary/Constant_2"Constant* value*@B/rotary/Constant_2_attr::valueJ?ׯ]???=&??S>>>>5>#r>GR>6>@>w>==xY= =M=Uf=?vG=,=H==TO;w3; i;o;(:\:ɮ:\:o:c:D:D;*:j:O9%9t9`˥9r9x9SW9Sw:9y!9r 9,8 _ /rotary/Reshape_output_0 /rotary/Constant_2_output_0/rotary/Mul_output_0 /rotary/Mul"Mul > /rotary/Mul_output_0/rotary/Cos_output_0 /rotary/Cos"Cos > /rotary/Mul_output_0/rotary/Sin_output_0 /rotary/Sin"Sin u/rotary/Constant_3_output_0/rotary/Constant_3"Constant*8 value*,B/rotary/Constant_3_attr::valueJ w/rotary/Constant_4_output_0/rotary/Constant_4"Constant*: value*.B/rotary/Constant_4_attr::valueJ m /rotary/Cos_output_0 /rotary/Constant_4_output_0/rotary/Unsqueeze_output_0/rotary/Unsqueeze" Unsqueeze w/rotary/Constant_5_output_0/rotary/Constant_5"Constant*: value*.B/rotary/Constant_5_attr::valueJ q /rotary/Sin_output_0 /rotary/Constant_5_output_0/rotary/Unsqueeze_1_output_0/rotary/Unsqueeze_1" Unsqueeze x /rotary/Unsqueeze_output_0 /rotary/Unsqueeze_1_output_0/rotary/Concat_output_0/rotary/Concat"Concat* axis } /rotary/Concat_output_0 /rotary/Concat_output_0/rotary/Concat_1_output_0/rotary/Concat_1"Concat* axis u/rotary/Constant_6_output_0/rotary/Constant_6"Constant*8 value*,B/rotary/Constant_6_attr::valueJ w/rotary/Constant_7_output_0/rotary/Constant_7"Constant*: value*.B/rotary/Constant_7_attr::valueJ v /rotary/Concat_1_output_0 /rotary/Constant_7_output_0/rotary/Unsqueeze_2_output_0/rotary/Unsqueeze_2" Unsqueeze u/rotary/Constant_8_output_0/rotary/Constant_8"Constant*8 value*,B/rotary/Constant_8_attr::valueJ w/rotary/Constant_9_output_0/rotary/Constant_9"Constant*: value*.B/rotary/Constant_9_attr::valueJ y /rotary/Unsqueeze_2_output_0 /rotary/Constant_9_output_0/rotary/Unsqueeze_3_output_0/rotary/Unsqueeze_3" Unsqueeze ^ past_key_values /rotary/Constant_3_output_0/Gather_output_0/Gather"Gather* axis /blocks.0/Constant_output_0/blocks.0/Constant"Constant*J value*>B/blocks.0/Constant_attr::valueJ r input_ids /blocks.0/Constant_output_0/blocks.0/Reshape_output_0/blocks.0/Reshape"Reshape* allowzero v /blocks.0/Reshape_output_0'/blocks.0/input_layernorm/Cast_output_0/blocks.0/input_layernorm/Cast"Cast* to +/blocks.0/input_layernorm/Constant_output_0"/blocks.0/input_layernorm/Constant"Constant*D value*8B./blocks.0/input_layernorm/Constant_attr::valueJ@  '/blocks.0/input_layernorm/Cast_output_0 +/blocks.0/input_layernorm/Constant_output_0&/blocks.0/input_layernorm/Pow_output_0/blocks.0/input_layernorm/Pow"Pow  &/blocks.0/input_layernorm/Pow_output_0-/blocks.0/input_layernorm/ReduceMean_output_0$/blocks.0/input_layernorm/ReduceMean" ReduceMean* axes@* keepdims -/blocks.0/input_layernorm/Constant_1_output_0$/blocks.0/input_layernorm/Constant_1"Constant*F value*:B0/blocks.0/input_layernorm/Constant_1_attr::valueJ75  -/blocks.0/input_layernorm/ReduceMean_output_0 -/blocks.0/input_layernorm/Constant_1_output_0&/blocks.0/input_layernorm/Add_output_0/blocks.0/input_layernorm/Add"Add w &/blocks.0/input_layernorm/Add_output_0'/blocks.0/input_layernorm/Sqrt_output_0/blocks.0/input_layernorm/Sqrt"Sqrt -/blocks.0/input_layernorm/Constant_2_output_0$/blocks.0/input_layernorm/Constant_2"Constant*F value*:B0/blocks.0/input_layernorm/Constant_2_attr::valueJ?  -/blocks.0/input_layernorm/Constant_2_output_0 '/blocks.0/input_layernorm/Sqrt_output_0&/blocks.0/input_layernorm/Div_output_0/blocks.0/input_layernorm/Div"Div  '/blocks.0/input_layernorm/Cast_output_0)/blocks.0/input_layernorm/Cast_1_output_0 /blocks.0/input_layernorm/Cast_1"Cast* to  )/blocks.0/input_layernorm/Cast_1_output_0 &/blocks.0/input_layernorm/Div_output_0&/blocks.0/input_layernorm/Mul_output_0/blocks.0/input_layernorm/Mul"Mul  &/blocks.0/input_layernorm/Mul_output_0 blocks.0.input_layernorm.weight(/blocks.0/input_layernorm/Mul_1_output_0/blocks.0/input_layernorm/Mul_1"Mul  (/blocks.0/input_layernorm/Mul_1_output_0)/blocks.0/input_layernorm/Cast_2_output_0 /blocks.0/input_layernorm/Cast_2"Cast* to q )/blocks.0/input_layernorm/Cast_2_output_0"/blocks.0/self_attn/Shape_output_0/blocks.0/self_attn/Shape"Shape %/blocks.0/self_attn/Constant_output_0/blocks.0/self_attn/Constant"Constant*B value*6B(/blocks.0/self_attn/Constant_attr::valueJ  "/blocks.0/self_attn/Shape_output_0 %/blocks.0/self_attn/Constant_output_0#/blocks.0/self_attn/Gather_output_0/blocks.0/self_attn/Gather"Gather* axis u )/blocks.0/input_layernorm/Cast_2_output_0$/blocks.0/self_attn/Shape_1_output_0/blocks.0/self_attn/Shape_1"Shape '/blocks.0/self_attn/Constant_1_output_0/blocks.0/self_attn/Constant_1"Constant*D value*8B*/blocks.0/self_attn/Constant_1_attr::valueJ  $/blocks.0/self_attn/Shape_1_output_0 '/blocks.0/self_attn/Constant_1_output_0%/blocks.0/self_attn/Gather_1_output_0/blocks.0/self_attn/Gather_1"Gather* axis  )/blocks.0/input_layernorm/Cast_2_output_0 onnx::MatMul_8565*/blocks.0/self_attn/q_proj/MatMul_output_0!/blocks.0/self_attn/q_proj/MatMul"MatMul  )/blocks.0/input_layernorm/Cast_2_output_0 onnx::MatMul_8566*/blocks.0/self_attn/k_proj/MatMul_output_0!/blocks.0/self_attn/k_proj/MatMul"MatMul  )/blocks.0/input_layernorm/Cast_2_output_0 onnx::MatMul_8567*/blocks.0/self_attn/v_proj/MatMul_output_0!/blocks.0/self_attn/v_proj/MatMul"MatMul '/blocks.0/self_attn/Constant_2_output_0/blocks.0/self_attn/Constant_2"Constant*D value*8B*/blocks.0/self_attn/Constant_2_attr::valueJ eonnx::Unsqueeze_368 Constant_2551"Constant*5 value*)BConstant_2551_attr::valueJ  #/blocks.0/self_attn/Gather_output_0 onnx::Unsqueeze_368&/blocks.0/self_attn/Unsqueeze_output_0/blocks.0/self_attn/Unsqueeze" Unsqueeze eonnx::Unsqueeze_370 Constant_2553"Constant*5 value*)BConstant_2553_attr::valueJ  %/blocks.0/self_attn/Gather_1_output_0 onnx::Unsqueeze_370(/blocks.0/self_attn/Unsqueeze_1_output_0/blocks.0/self_attn/Unsqueeze_1" Unsqueeze '/blocks.0/self_attn/Constant_3_output_0/blocks.0/self_attn/Constant_3"Constant*F value*:B*/blocks.0/self_attn/Constant_3_attr::valueJ '/blocks.0/self_attn/Constant_4_output_0/blocks.0/self_attn/Constant_4"Constant*F value*:B*/blocks.0/self_attn/Constant_4_attr::valueJ  &/blocks.0/self_attn/Unsqueeze_output_0 (/blocks.0/self_attn/Unsqueeze_1_output_0 '/blocks.0/self_attn/Constant_3_output_0 '/blocks.0/self_attn/Constant_4_output_0#/blocks.0/self_attn/Concat_output_0/blocks.0/self_attn/Concat"Concat* axis  */blocks.0/self_attn/q_proj/MatMul_output_0 #/blocks.0/self_attn/Concat_output_0$/blocks.0/self_attn/Reshape_output_0/blocks.0/self_attn/Reshape"Reshape* allowzero '/blocks.0/self_attn/Constant_5_output_0/blocks.0/self_attn/Constant_5"Constant*D value*8B*/blocks.0/self_attn/Constant_5_attr::valueJ eonnx::Unsqueeze_379 Constant_2560"Constant*5 value*)BConstant_2560_attr::valueJ  #/blocks.0/self_attn/Gather_output_0 onnx::Unsqueeze_379(/blocks.0/self_attn/Unsqueeze_2_output_0/blocks.0/self_attn/Unsqueeze_2" Unsqueeze eonnx::Unsqueeze_381 Constant_2562"Constant*5 value*)BConstant_2562_attr::valueJ  %/blocks.0/self_attn/Gather_1_output_0 onnx::Unsqueeze_381(/blocks.0/self_attn/Unsqueeze_3_output_0/blocks.0/self_attn/Unsqueeze_3" Unsqueeze '/blocks.0/self_attn/Constant_6_output_0/blocks.0/self_attn/Constant_6"Constant*F value*:B*/blocks.0/self_attn/Constant_6_attr::valueJ '/blocks.0/self_attn/Constant_7_output_0/blocks.0/self_attn/Constant_7"Constant*F value*:B*/blocks.0/self_attn/Constant_7_attr::valueJ  (/blocks.0/self_attn/Unsqueeze_2_output_0 (/blocks.0/self_attn/Unsqueeze_3_output_0 '/blocks.0/self_attn/Constant_6_output_0 '/blocks.0/self_attn/Constant_7_output_0%/blocks.0/self_attn/Concat_1_output_0/blocks.0/self_attn/Concat_1"Concat* axis eonnx::Unsqueeze_388 Constant_2567"Constant*5 value*)BConstant_2567_attr::valueJ  #/blocks.0/self_attn/Gather_output_0 onnx::Unsqueeze_388(/blocks.0/self_attn/Unsqueeze_4_output_0/blocks.0/self_attn/Unsqueeze_4" Unsqueeze eonnx::Unsqueeze_390 Constant_2569"Constant*5 value*)BConstant_2569_attr::valueJ  %/blocks.0/self_attn/Gather_1_output_0 onnx::Unsqueeze_390(/blocks.0/self_attn/Unsqueeze_5_output_0/blocks.0/self_attn/Unsqueeze_5" Unsqueeze '/blocks.0/self_attn/Constant_8_output_0/blocks.0/self_attn/Constant_8"Constant*F value*:B*/blocks.0/self_attn/Constant_8_attr::valueJ '/blocks.0/self_attn/Constant_9_output_0/blocks.0/self_attn/Constant_9"Constant*F value*:B*/blocks.0/self_attn/Constant_9_attr::valueJ  (/blocks.0/self_attn/Unsqueeze_4_output_0 (/blocks.0/self_attn/Unsqueeze_5_output_0 '/blocks.0/self_attn/Constant_8_output_0 '/blocks.0/self_attn/Constant_9_output_0%/blocks.0/self_attn/Concat_2_output_0/blocks.0/self_attn/Concat_2"Concat* axis  */blocks.0/self_attn/k_proj/MatMul_output_0 %/blocks.0/self_attn/Concat_1_output_0&/blocks.0/self_attn/Reshape_1_output_0/blocks.0/self_attn/Reshape_1"Reshape* allowzero  */blocks.0/self_attn/v_proj/MatMul_output_0 %/blocks.0/self_attn/Concat_2_output_0&/blocks.0/self_attn/Reshape_2_output_0/blocks.0/self_attn/Reshape_2"Reshape* allowzero  $/blocks.0/self_attn/Reshape_output_0(/blocks.0/self_attn/q_norm/Cast_output_0/blocks.0/self_attn/q_norm/Cast"Cast* to ,/blocks.0/self_attn/q_norm/Constant_output_0#/blocks.0/self_attn/q_norm/Constant"Constant*E value*9B//blocks.0/self_attn/q_norm/Constant_attr::valueJ@  (/blocks.0/self_attn/q_norm/Cast_output_0 ,/blocks.0/self_attn/q_norm/Constant_output_0'/blocks.0/self_attn/q_norm/Pow_output_0/blocks.0/self_attn/q_norm/Pow"Pow  '/blocks.0/self_attn/q_norm/Pow_output_0./blocks.0/self_attn/q_norm/ReduceMean_output_0%/blocks.0/self_attn/q_norm/ReduceMean" ReduceMean* axes@* keepdims ./blocks.0/self_attn/q_norm/Constant_1_output_0%/blocks.0/self_attn/q_norm/Constant_1"Constant*G value*;B1/blocks.0/self_attn/q_norm/Constant_1_attr::valueJ75  ./blocks.0/self_attn/q_norm/ReduceMean_output_0 ./blocks.0/self_attn/q_norm/Constant_1_output_0'/blocks.0/self_attn/q_norm/Add_output_0/blocks.0/self_attn/q_norm/Add"Add z '/blocks.0/self_attn/q_norm/Add_output_0(/blocks.0/self_attn/q_norm/Sqrt_output_0/blocks.0/self_attn/q_norm/Sqrt"Sqrt ./blocks.0/self_attn/q_norm/Constant_2_output_0%/blocks.0/self_attn/q_norm/Constant_2"Constant*G value*;B1/blocks.0/self_attn/q_norm/Constant_2_attr::valueJ?  ./blocks.0/self_attn/q_norm/Constant_2_output_0 (/blocks.0/self_attn/q_norm/Sqrt_output_0'/blocks.0/self_attn/q_norm/Div_output_0/blocks.0/self_attn/q_norm/Div"Div  (/blocks.0/self_attn/q_norm/Cast_output_0*/blocks.0/self_attn/q_norm/Cast_1_output_0!/blocks.0/self_attn/q_norm/Cast_1"Cast* to  */blocks.0/self_attn/q_norm/Cast_1_output_0 '/blocks.0/self_attn/q_norm/Div_output_0'/blocks.0/self_attn/q_norm/Mul_output_0/blocks.0/self_attn/q_norm/Mul"Mul  '/blocks.0/self_attn/q_norm/Mul_output_0 blocks.0.self_attn.q_norm.weight)/blocks.0/self_attn/q_norm/Mul_1_output_0 /blocks.0/self_attn/q_norm/Mul_1"Mul  )/blocks.0/self_attn/q_norm/Mul_1_output_0*/blocks.0/self_attn/q_norm/Cast_2_output_0!/blocks.0/self_attn/q_norm/Cast_2"Cast* to  &/blocks.0/self_attn/Reshape_1_output_0(/blocks.0/self_attn/k_norm/Cast_output_0/blocks.0/self_attn/k_norm/Cast"Cast* to ,/blocks.0/self_attn/k_norm/Constant_output_0#/blocks.0/self_attn/k_norm/Constant"Constant*E value*9B//blocks.0/self_attn/k_norm/Constant_attr::valueJ@  (/blocks.0/self_attn/k_norm/Cast_output_0 ,/blocks.0/self_attn/k_norm/Constant_output_0'/blocks.0/self_attn/k_norm/Pow_output_0/blocks.0/self_attn/k_norm/Pow"Pow  '/blocks.0/self_attn/k_norm/Pow_output_0./blocks.0/self_attn/k_norm/ReduceMean_output_0%/blocks.0/self_attn/k_norm/ReduceMean" ReduceMean* axes@* keepdims ./blocks.0/self_attn/k_norm/Constant_1_output_0%/blocks.0/self_attn/k_norm/Constant_1"Constant*G value*;B1/blocks.0/self_attn/k_norm/Constant_1_attr::valueJ75  ./blocks.0/self_attn/k_norm/ReduceMean_output_0 ./blocks.0/self_attn/k_norm/Constant_1_output_0'/blocks.0/self_attn/k_norm/Add_output_0/blocks.0/self_attn/k_norm/Add"Add z '/blocks.0/self_attn/k_norm/Add_output_0(/blocks.0/self_attn/k_norm/Sqrt_output_0/blocks.0/self_attn/k_norm/Sqrt"Sqrt ./blocks.0/self_attn/k_norm/Constant_2_output_0%/blocks.0/self_attn/k_norm/Constant_2"Constant*G value*;B1/blocks.0/self_attn/k_norm/Constant_2_attr::valueJ?  ./blocks.0/self_attn/k_norm/Constant_2_output_0 (/blocks.0/self_attn/k_norm/Sqrt_output_0'/blocks.0/self_attn/k_norm/Div_output_0/blocks.0/self_attn/k_norm/Div"Div  (/blocks.0/self_attn/k_norm/Cast_output_0*/blocks.0/self_attn/k_norm/Cast_1_output_0!/blocks.0/self_attn/k_norm/Cast_1"Cast* to  */blocks.0/self_attn/k_norm/Cast_1_output_0 '/blocks.0/self_attn/k_norm/Div_output_0'/blocks.0/self_attn/k_norm/Mul_output_0/blocks.0/self_attn/k_norm/Mul"Mul  '/blocks.0/self_attn/k_norm/Mul_output_0 blocks.0.self_attn.k_norm.weight)/blocks.0/self_attn/k_norm/Mul_1_output_0 /blocks.0/self_attn/k_norm/Mul_1"Mul  )/blocks.0/self_attn/k_norm/Mul_1_output_0*/blocks.0/self_attn/k_norm/Cast_2_output_0!/blocks.0/self_attn/k_norm/Cast_2"Cast* to  /rotary/Unsqueeze_3_output_0 /rotary/Constant_3_output_0%/blocks.0/self_attn/Gather_2_output_0/blocks.0/self_attn/Gather_2"Gather* axis  /rotary/Unsqueeze_3_output_0 /rotary/Constant_8_output_0%/blocks.0/self_attn/Gather_3_output_0/blocks.0/self_attn/Gather_3"Gather* axis  */blocks.0/self_attn/q_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0 /blocks.0/self_attn/Mul_output_0/blocks.0/self_attn/Mul"Mul (/blocks.0/self_attn/Constant_10_output_0/blocks.0/self_attn/Constant_10"Constant*E value*9B+/blocks.0/self_attn/Constant_10_attr::valueJ v */blocks.0/self_attn/q_norm/Cast_2_output_0$/blocks.0/self_attn/Shape_2_output_0/blocks.0/self_attn/Shape_2"Shape (/blocks.0/self_attn/Constant_11_output_0/blocks.0/self_attn/Constant_11"Constant*E value*9B+/blocks.0/self_attn/Constant_11_attr::valueJ  $/blocks.0/self_attn/Shape_2_output_0 (/blocks.0/self_attn/Constant_11_output_0%/blocks.0/self_attn/Gather_4_output_0/blocks.0/self_attn/Gather_4"Gather* axis (/blocks.0/self_attn/Constant_12_output_0/blocks.0/self_attn/Constant_12"Constant*E value*9B+/blocks.0/self_attn/Constant_12_attr::valueJ  %/blocks.0/self_attn/Gather_4_output_0 (/blocks.0/self_attn/Constant_12_output_0 /blocks.0/self_attn/Div_output_0/blocks.0/self_attn/Div"Div p /blocks.0/self_attn/Div_output_0!/blocks.0/self_attn/Cast_output_0/blocks.0/self_attn/Cast"Cast* to u !/blocks.0/self_attn/Cast_output_0#/blocks.0/self_attn/Cast_1_output_0/blocks.0/self_attn/Cast_1"Cast* to (/blocks.0/self_attn/Constant_13_output_0/blocks.0/self_attn/Constant_13"Constant*G value*;B+/blocks.0/self_attn/Constant_13_attr::valueJ (/blocks.0/self_attn/Constant_14_output_0/blocks.0/self_attn/Constant_14"Constant*G value*;B+/blocks.0/self_attn/Constant_14_attr::valueJ (/blocks.0/self_attn/Constant_15_output_0/blocks.0/self_attn/Constant_15"Constant*G value*;B+/blocks.0/self_attn/Constant_15_attr::valueJ  #/blocks.0/self_attn/Cast_1_output_0 (/blocks.0/self_attn/Constant_15_output_0(/blocks.0/self_attn/Unsqueeze_6_output_0/blocks.0/self_attn/Unsqueeze_6" Unsqueeze (/blocks.0/self_attn/Constant_16_output_0/blocks.0/self_attn/Constant_16"Constant*G value*;B+/blocks.0/self_attn/Constant_16_attr::valueJ  */blocks.0/self_attn/q_norm/Cast_2_output_0 (/blocks.0/self_attn/Constant_14_output_0 (/blocks.0/self_attn/Unsqueeze_6_output_0 (/blocks.0/self_attn/Constant_13_output_0 (/blocks.0/self_attn/Constant_16_output_0"/blocks.0/self_attn/Slice_output_0/blocks.0/self_attn/Slice"Slice (/blocks.0/self_attn/Constant_17_output_0/blocks.0/self_attn/Constant_17"Constant*G value*;B+/blocks.0/self_attn/Constant_17_attr::valueJ (/blocks.0/self_attn/Constant_18_output_0/blocks.0/self_attn/Constant_18"Constant*G value*;B+/blocks.0/self_attn/Constant_18_attr::valueJ  #/blocks.0/self_attn/Cast_1_output_0 (/blocks.0/self_attn/Constant_18_output_0(/blocks.0/self_attn/Unsqueeze_7_output_0/blocks.0/self_attn/Unsqueeze_7" Unsqueeze (/blocks.0/self_attn/Constant_19_output_0/blocks.0/self_attn/Constant_19"Constant*G value*;B+/blocks.0/self_attn/Constant_19_attr::valueJ (/blocks.0/self_attn/Constant_20_output_0/blocks.0/self_attn/Constant_20"Constant*G value*;B+/blocks.0/self_attn/Constant_20_attr::valueJ  */blocks.0/self_attn/q_norm/Cast_2_output_0 (/blocks.0/self_attn/Unsqueeze_7_output_0 (/blocks.0/self_attn/Constant_19_output_0 (/blocks.0/self_attn/Constant_17_output_0 (/blocks.0/self_attn/Constant_20_output_0$/blocks.0/self_attn/Slice_1_output_0/blocks.0/self_attn/Slice_1"Slice f $/blocks.0/self_attn/Slice_1_output_0 /blocks.0/self_attn/Neg_output_0/blocks.0/self_attn/Neg"Neg  /blocks.0/self_attn/Neg_output_0 "/blocks.0/self_attn/Slice_output_0%/blocks.0/self_attn/Concat_3_output_0/blocks.0/self_attn/Concat_3"Concat* axis  %/blocks.0/self_attn/Concat_3_output_0 %/blocks.0/self_attn/Gather_3_output_0"/blocks.0/self_attn/Mul_1_output_0/blocks.0/self_attn/Mul_1"Mul  /blocks.0/self_attn/Mul_output_0 "/blocks.0/self_attn/Mul_1_output_0 /blocks.0/self_attn/Add_output_0/blocks.0/self_attn/Add"Add  */blocks.0/self_attn/k_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0"/blocks.0/self_attn/Mul_2_output_0/blocks.0/self_attn/Mul_2"Mul v */blocks.0/self_attn/k_norm/Cast_2_output_0$/blocks.0/self_attn/Shape_3_output_0/blocks.0/self_attn/Shape_3"Shape (/blocks.0/self_attn/Constant_21_output_0/blocks.0/self_attn/Constant_21"Constant*E value*9B+/blocks.0/self_attn/Constant_21_attr::valueJ  $/blocks.0/self_attn/Shape_3_output_0 (/blocks.0/self_attn/Constant_21_output_0%/blocks.0/self_attn/Gather_5_output_0/blocks.0/self_attn/Gather_5"Gather* axis (/blocks.0/self_attn/Constant_22_output_0/blocks.0/self_attn/Constant_22"Constant*E value*9B+/blocks.0/self_attn/Constant_22_attr::valueJ  %/blocks.0/self_attn/Gather_5_output_0 (/blocks.0/self_attn/Constant_22_output_0"/blocks.0/self_attn/Div_1_output_0/blocks.0/self_attn/Div_1"Div v "/blocks.0/self_attn/Div_1_output_0#/blocks.0/self_attn/Cast_2_output_0/blocks.0/self_attn/Cast_2"Cast* to w #/blocks.0/self_attn/Cast_2_output_0#/blocks.0/self_attn/Cast_3_output_0/blocks.0/self_attn/Cast_3"Cast* to (/blocks.0/self_attn/Constant_23_output_0/blocks.0/self_attn/Constant_23"Constant*G value*;B+/blocks.0/self_attn/Constant_23_attr::valueJ (/blocks.0/self_attn/Constant_24_output_0/blocks.0/self_attn/Constant_24"Constant*G value*;B+/blocks.0/self_attn/Constant_24_attr::valueJ (/blocks.0/self_attn/Constant_25_output_0/blocks.0/self_attn/Constant_25"Constant*G value*;B+/blocks.0/self_attn/Constant_25_attr::valueJ  #/blocks.0/self_attn/Cast_3_output_0 (/blocks.0/self_attn/Constant_25_output_0(/blocks.0/self_attn/Unsqueeze_8_output_0/blocks.0/self_attn/Unsqueeze_8" Unsqueeze (/blocks.0/self_attn/Constant_26_output_0/blocks.0/self_attn/Constant_26"Constant*G value*;B+/blocks.0/self_attn/Constant_26_attr::valueJ  */blocks.0/self_attn/k_norm/Cast_2_output_0 (/blocks.0/self_attn/Constant_24_output_0 (/blocks.0/self_attn/Unsqueeze_8_output_0 (/blocks.0/self_attn/Constant_23_output_0 (/blocks.0/self_attn/Constant_26_output_0$/blocks.0/self_attn/Slice_2_output_0/blocks.0/self_attn/Slice_2"Slice (/blocks.0/self_attn/Constant_27_output_0/blocks.0/self_attn/Constant_27"Constant*G value*;B+/blocks.0/self_attn/Constant_27_attr::valueJ (/blocks.0/self_attn/Constant_28_output_0/blocks.0/self_attn/Constant_28"Constant*G value*;B+/blocks.0/self_attn/Constant_28_attr::valueJ  #/blocks.0/self_attn/Cast_3_output_0 (/blocks.0/self_attn/Constant_28_output_0(/blocks.0/self_attn/Unsqueeze_9_output_0/blocks.0/self_attn/Unsqueeze_9" Unsqueeze (/blocks.0/self_attn/Constant_29_output_0/blocks.0/self_attn/Constant_29"Constant*G value*;B+/blocks.0/self_attn/Constant_29_attr::valueJ (/blocks.0/self_attn/Constant_30_output_0/blocks.0/self_attn/Constant_30"Constant*G value*;B+/blocks.0/self_attn/Constant_30_attr::valueJ  */blocks.0/self_attn/k_norm/Cast_2_output_0 (/blocks.0/self_attn/Unsqueeze_9_output_0 (/blocks.0/self_attn/Constant_29_output_0 (/blocks.0/self_attn/Constant_27_output_0 (/blocks.0/self_attn/Constant_30_output_0$/blocks.0/self_attn/Slice_3_output_0/blocks.0/self_attn/Slice_3"Slice j $/blocks.0/self_attn/Slice_3_output_0"/blocks.0/self_attn/Neg_1_output_0/blocks.0/self_attn/Neg_1"Neg  "/blocks.0/self_attn/Neg_1_output_0 $/blocks.0/self_attn/Slice_2_output_0%/blocks.0/self_attn/Concat_4_output_0/blocks.0/self_attn/Concat_4"Concat* axis  %/blocks.0/self_attn/Concat_4_output_0 %/blocks.0/self_attn/Gather_3_output_0"/blocks.0/self_attn/Mul_3_output_0/blocks.0/self_attn/Mul_3"Mul  "/blocks.0/self_attn/Mul_2_output_0 "/blocks.0/self_attn/Mul_3_output_0"/blocks.0/self_attn/Add_1_output_0/blocks.0/self_attn/Add_1"Add  /Gather_output_0 /rotary/Constant_3_output_0%/blocks.0/self_attn/Gather_6_output_0/blocks.0/self_attn/Gather_6"Gather* axis  /Gather_output_0 /rotary/Constant_8_output_0%/blocks.0/self_attn/Gather_7_output_0/blocks.0/self_attn/Gather_7"Gather* axis  %/blocks.0/self_attn/Gather_6_output_0 "/blocks.0/self_attn/Add_1_output_0%/blocks.0/self_attn/Concat_5_output_0/blocks.0/self_attn/Concat_5"Concat* axis  %/blocks.0/self_attn/Gather_7_output_0 &/blocks.0/self_attn/Reshape_2_output_0%/blocks.0/self_attn/Concat_6_output_0/blocks.0/self_attn/Concat_6"Concat* axis (/blocks.0/self_attn/Constant_31_output_0/blocks.0/self_attn/Constant_31"Constant*G value*;B+/blocks.0/self_attn/Constant_31_attr::valueJ  %/blocks.0/self_attn/Concat_5_output_0 (/blocks.0/self_attn/Constant_31_output_0)/blocks.0/self_attn/Unsqueeze_10_output_0 /blocks.0/self_attn/Unsqueeze_10" Unsqueeze (/blocks.0/self_attn/Constant_32_output_0/blocks.0/self_attn/Constant_32"Constant*G value*;B+/blocks.0/self_attn/Constant_32_attr::valueJ  %/blocks.0/self_attn/Concat_6_output_0 (/blocks.0/self_attn/Constant_32_output_0)/blocks.0/self_attn/Unsqueeze_11_output_0 /blocks.0/self_attn/Unsqueeze_11" Unsqueeze  )/blocks.0/self_attn/Unsqueeze_10_output_0 )/blocks.0/self_attn/Unsqueeze_11_output_0%/blocks.0/self_attn/Concat_7_output_0/blocks.0/self_attn/Concat_7"Concat* axis  /blocks.0/self_attn/Add_output_0&/blocks.0/self_attn/Transpose_output_0/blocks.0/self_attn/Transpose" Transpose* perm@@@@  %/blocks.0/self_attn/Concat_5_output_0(/blocks.0/self_attn/Transpose_1_output_0/blocks.0/self_attn/Transpose_1" Transpose* perm@@@@  %/blocks.0/self_attn/Concat_6_output_0(/blocks.0/self_attn/Transpose_2_output_0/blocks.0/self_attn/Transpose_2" Transpose* perm@@@@ t (/blocks.0/self_attn/Transpose_1_output_0$/blocks.0/self_attn/Shape_4_output_0/blocks.0/self_attn/Shape_4"Shape (/blocks.0/self_attn/Constant_33_output_0/blocks.0/self_attn/Constant_33"Constant*E value*9B+/blocks.0/self_attn/Constant_33_attr::valueJ  $/blocks.0/self_attn/Shape_4_output_0 (/blocks.0/self_attn/Constant_33_output_0%/blocks.0/self_attn/Gather_8_output_0/blocks.0/self_attn/Gather_8"Gather* axis t (/blocks.0/self_attn/Transpose_1_output_0$/blocks.0/self_attn/Shape_5_output_0/blocks.0/self_attn/Shape_5"Shape (/blocks.0/self_attn/Constant_34_output_0/blocks.0/self_attn/Constant_34"Constant*E value*9B+/blocks.0/self_attn/Constant_34_attr::valueJ  $/blocks.0/self_attn/Shape_5_output_0 (/blocks.0/self_attn/Constant_34_output_0%/blocks.0/self_attn/Gather_9_output_0/blocks.0/self_attn/Gather_9"Gather* axis t (/blocks.0/self_attn/Transpose_1_output_0$/blocks.0/self_attn/Shape_6_output_0/blocks.0/self_attn/Shape_6"Shape (/blocks.0/self_attn/Constant_35_output_0/blocks.0/self_attn/Constant_35"Constant*E value*9B+/blocks.0/self_attn/Constant_35_attr::valueJ  $/blocks.0/self_attn/Shape_6_output_0 (/blocks.0/self_attn/Constant_35_output_0&/blocks.0/self_attn/Gather_10_output_0/blocks.0/self_attn/Gather_10"Gather* axis t (/blocks.0/self_attn/Transpose_1_output_0$/blocks.0/self_attn/Shape_7_output_0/blocks.0/self_attn/Shape_7"Shape (/blocks.0/self_attn/Constant_36_output_0/blocks.0/self_attn/Constant_36"Constant*E value*9B+/blocks.0/self_attn/Constant_36_attr::valueJ  $/blocks.0/self_attn/Shape_7_output_0 (/blocks.0/self_attn/Constant_36_output_0&/blocks.0/self_attn/Gather_11_output_0/blocks.0/self_attn/Gather_11"Gather* axis (/blocks.0/self_attn/Constant_37_output_0/blocks.0/self_attn/Constant_37"Constant*G value*;B+/blocks.0/self_attn/Constant_37_attr::valueJ  (/blocks.0/self_attn/Transpose_1_output_0 (/blocks.0/self_attn/Constant_37_output_0)/blocks.0/self_attn/Unsqueeze_12_output_0 /blocks.0/self_attn/Unsqueeze_12" Unsqueeze (/blocks.0/self_attn/Constant_38_output_0/blocks.0/self_attn/Constant_38"Constant*E value*9B+/blocks.0/self_attn/Constant_38_attr::valueJ (/blocks.0/self_attn/Constant_39_output_0/blocks.0/self_attn/Constant_39"Constant*G value*;B+/blocks.0/self_attn/Constant_39_attr::valueJ  %/blocks.0/self_attn/Gather_8_output_0 (/blocks.0/self_attn/Constant_39_output_0)/blocks.0/self_attn/Unsqueeze_13_output_0 /blocks.0/self_attn/Unsqueeze_13" Unsqueeze (/blocks.0/self_attn/Constant_40_output_0/blocks.0/self_attn/Constant_40"Constant*G value*;B+/blocks.0/self_attn/Constant_40_attr::valueJ  %/blocks.0/self_attn/Gather_9_output_0 (/blocks.0/self_attn/Constant_40_output_0)/blocks.0/self_attn/Unsqueeze_14_output_0 /blocks.0/self_attn/Unsqueeze_14" Unsqueeze (/blocks.0/self_attn/Constant_41_output_0/blocks.0/self_attn/Constant_41"Constant*G value*;B+/blocks.0/self_attn/Constant_41_attr::valueJ (/blocks.0/self_attn/Constant_42_output_0/blocks.0/self_attn/Constant_42"Constant*G value*;B+/blocks.0/self_attn/Constant_42_attr::valueJ  &/blocks.0/self_attn/Gather_10_output_0 (/blocks.0/self_attn/Constant_42_output_0)/blocks.0/self_attn/Unsqueeze_15_output_0 /blocks.0/self_attn/Unsqueeze_15" Unsqueeze (/blocks.0/self_attn/Constant_43_output_0/blocks.0/self_attn/Constant_43"Constant*G value*;B+/blocks.0/self_attn/Constant_43_attr::valueJ  &/blocks.0/self_attn/Gather_11_output_0 (/blocks.0/self_attn/Constant_43_output_0)/blocks.0/self_attn/Unsqueeze_16_output_0 /blocks.0/self_attn/Unsqueeze_16" Unsqueeze  )/blocks.0/self_attn/Unsqueeze_13_output_0 )/blocks.0/self_attn/Unsqueeze_14_output_0 (/blocks.0/self_attn/Constant_41_output_0 )/blocks.0/self_attn/Unsqueeze_15_output_0 )/blocks.0/self_attn/Unsqueeze_16_output_0%/blocks.0/self_attn/Concat_8_output_0/blocks.0/self_attn/Concat_8"Concat* axis (/blocks.0/self_attn/Constant_44_output_0/blocks.0/self_attn/Constant_44"Constant*G value*;B+/blocks.0/self_attn/Constant_44_attr::valueJ  %/blocks.0/self_attn/Concat_8_output_0 (/blocks.0/self_attn/Constant_44_output_0&/blocks.0/self_attn/Reshape_3_output_0/blocks.0/self_attn/Reshape_3"Reshape* allowzero r &/blocks.0/self_attn/Reshape_3_output_0$/blocks.0/self_attn/Shape_8_output_0/blocks.0/self_attn/Shape_8"Shape  $/blocks.0/self_attn/Shape_8_output_0,/blocks.0/self_attn/ConstantOfShape_output_0#/blocks.0/self_attn/ConstantOfShape"ConstantOfShape*K value*?B//blocks.0/self_attn/ConstantOfShape_attr::valueJ (/blocks.0/self_attn/Constant_45_output_0/blocks.0/self_attn/Constant_45"Constant*E value*9B+/blocks.0/self_attn/Constant_45_attr::valueJ  ,/blocks.0/self_attn/ConstantOfShape_output_0 (/blocks.0/self_attn/Constant_45_output_0"/blocks.0/self_attn/Mul_4_output_0/blocks.0/self_attn/Mul_4"Mul  &/blocks.0/self_attn/Reshape_3_output_0 "/blocks.0/self_attn/Mul_4_output_0"/blocks.0/self_attn/Equal_output_0/blocks.0/self_attn/Equal"Equal  "/blocks.0/self_attn/Equal_output_0 ,/blocks.0/self_attn/ConstantOfShape_output_0 &/blocks.0/self_attn/Reshape_3_output_0"/blocks.0/self_attn/Where_output_0/blocks.0/self_attn/Where"Where  )/blocks.0/self_attn/Unsqueeze_12_output_0 "/blocks.0/self_attn/Where_output_0#/blocks.0/self_attn/Expand_output_0/blocks.0/self_attn/Expand"Expand (/blocks.0/self_attn/Constant_46_output_0/blocks.0/self_attn/Constant_46"Constant*E value*9B+/blocks.0/self_attn/Constant_46_attr::valueJ  %/blocks.0/self_attn/Gather_9_output_0 (/blocks.0/self_attn/Constant_46_output_0"/blocks.0/self_attn/Mul_5_output_0/blocks.0/self_attn/Mul_5"Mul eonnx::Unsqueeze_538 Constant_2701"Constant*5 value*)BConstant_2701_attr::valueJ  %/blocks.0/self_attn/Gather_8_output_0 onnx::Unsqueeze_538)/blocks.0/self_attn/Unsqueeze_17_output_0 /blocks.0/self_attn/Unsqueeze_17" Unsqueeze eonnx::Unsqueeze_540 Constant_2703"Constant*5 value*)BConstant_2703_attr::valueJ  "/blocks.0/self_attn/Mul_5_output_0 onnx::Unsqueeze_540)/blocks.0/self_attn/Unsqueeze_18_output_0 /blocks.0/self_attn/Unsqueeze_18" Unsqueeze eonnx::Unsqueeze_542 Constant_2705"Constant*5 value*)BConstant_2705_attr::valueJ  &/blocks.0/self_attn/Gather_10_output_0 onnx::Unsqueeze_542)/blocks.0/self_attn/Unsqueeze_19_output_0 /blocks.0/self_attn/Unsqueeze_19" Unsqueeze eonnx::Unsqueeze_544 Constant_2707"Constant*5 value*)BConstant_2707_attr::valueJ  &/blocks.0/self_attn/Gather_11_output_0 onnx::Unsqueeze_544)/blocks.0/self_attn/Unsqueeze_20_output_0 /blocks.0/self_attn/Unsqueeze_20" Unsqueeze  )/blocks.0/self_attn/Unsqueeze_17_output_0 )/blocks.0/self_attn/Unsqueeze_18_output_0 )/blocks.0/self_attn/Unsqueeze_19_output_0 )/blocks.0/self_attn/Unsqueeze_20_output_0%/blocks.0/self_attn/Concat_9_output_0/blocks.0/self_attn/Concat_9"Concat* axis  #/blocks.0/self_attn/Expand_output_0 %/blocks.0/self_attn/Concat_9_output_0&/blocks.0/self_attn/Reshape_4_output_0/blocks.0/self_attn/Reshape_4"Reshape* allowzero t (/blocks.0/self_attn/Transpose_2_output_0$/blocks.0/self_attn/Shape_9_output_0/blocks.0/self_attn/Shape_9"Shape (/blocks.0/self_attn/Constant_47_output_0/blocks.0/self_attn/Constant_47"Constant*E value*9B+/blocks.0/self_attn/Constant_47_attr::valueJ  $/blocks.0/self_attn/Shape_9_output_0 (/blocks.0/self_attn/Constant_47_output_0&/blocks.0/self_attn/Gather_12_output_0/blocks.0/self_attn/Gather_12"Gather* axis v (/blocks.0/self_attn/Transpose_2_output_0%/blocks.0/self_attn/Shape_10_output_0/blocks.0/self_attn/Shape_10"Shape (/blocks.0/self_attn/Constant_48_output_0/blocks.0/self_attn/Constant_48"Constant*E value*9B+/blocks.0/self_attn/Constant_48_attr::valueJ  %/blocks.0/self_attn/Shape_10_output_0 (/blocks.0/self_attn/Constant_48_output_0&/blocks.0/self_attn/Gather_13_output_0/blocks.0/self_attn/Gather_13"Gather* axis v (/blocks.0/self_attn/Transpose_2_output_0%/blocks.0/self_attn/Shape_11_output_0/blocks.0/self_attn/Shape_11"Shape (/blocks.0/self_attn/Constant_49_output_0/blocks.0/self_attn/Constant_49"Constant*E value*9B+/blocks.0/self_attn/Constant_49_attr::valueJ  %/blocks.0/self_attn/Shape_11_output_0 (/blocks.0/self_attn/Constant_49_output_0&/blocks.0/self_attn/Gather_14_output_0/blocks.0/self_attn/Gather_14"Gather* axis v (/blocks.0/self_attn/Transpose_2_output_0%/blocks.0/self_attn/Shape_12_output_0/blocks.0/self_attn/Shape_12"Shape (/blocks.0/self_attn/Constant_50_output_0/blocks.0/self_attn/Constant_50"Constant*E value*9B+/blocks.0/self_attn/Constant_50_attr::valueJ  %/blocks.0/self_attn/Shape_12_output_0 (/blocks.0/self_attn/Constant_50_output_0&/blocks.0/self_attn/Gather_15_output_0/blocks.0/self_attn/Gather_15"Gather* axis (/blocks.0/self_attn/Constant_51_output_0/blocks.0/self_attn/Constant_51"Constant*G value*;B+/blocks.0/self_attn/Constant_51_attr::valueJ  (/blocks.0/self_attn/Transpose_2_output_0 (/blocks.0/self_attn/Constant_51_output_0)/blocks.0/self_attn/Unsqueeze_21_output_0 /blocks.0/self_attn/Unsqueeze_21" Unsqueeze (/blocks.0/self_attn/Constant_52_output_0/blocks.0/self_attn/Constant_52"Constant*G value*;B+/blocks.0/self_attn/Constant_52_attr::valueJ  &/blocks.0/self_attn/Gather_12_output_0 (/blocks.0/self_attn/Constant_52_output_0)/blocks.0/self_attn/Unsqueeze_22_output_0 /blocks.0/self_attn/Unsqueeze_22" Unsqueeze (/blocks.0/self_attn/Constant_53_output_0/blocks.0/self_attn/Constant_53"Constant*G value*;B+/blocks.0/self_attn/Constant_53_attr::valueJ  &/blocks.0/self_attn/Gather_13_output_0 (/blocks.0/self_attn/Constant_53_output_0)/blocks.0/self_attn/Unsqueeze_23_output_0 /blocks.0/self_attn/Unsqueeze_23" Unsqueeze (/blocks.0/self_attn/Constant_54_output_0/blocks.0/self_attn/Constant_54"Constant*G value*;B+/blocks.0/self_attn/Constant_54_attr::valueJ (/blocks.0/self_attn/Constant_55_output_0/blocks.0/self_attn/Constant_55"Constant*G value*;B+/blocks.0/self_attn/Constant_55_attr::valueJ  &/blocks.0/self_attn/Gather_14_output_0 (/blocks.0/self_attn/Constant_55_output_0)/blocks.0/self_attn/Unsqueeze_24_output_0 /blocks.0/self_attn/Unsqueeze_24" Unsqueeze (/blocks.0/self_attn/Constant_56_output_0/blocks.0/self_attn/Constant_56"Constant*G value*;B+/blocks.0/self_attn/Constant_56_attr::valueJ  &/blocks.0/self_attn/Gather_15_output_0 (/blocks.0/self_attn/Constant_56_output_0)/blocks.0/self_attn/Unsqueeze_25_output_0 /blocks.0/self_attn/Unsqueeze_25" Unsqueeze  )/blocks.0/self_attn/Unsqueeze_22_output_0 )/blocks.0/self_attn/Unsqueeze_23_output_0 (/blocks.0/self_attn/Constant_54_output_0 )/blocks.0/self_attn/Unsqueeze_24_output_0 )/blocks.0/self_attn/Unsqueeze_25_output_0&/blocks.0/self_attn/Concat_10_output_0/blocks.0/self_attn/Concat_10"Concat* axis (/blocks.0/self_attn/Constant_57_output_0/blocks.0/self_attn/Constant_57"Constant*G value*;B+/blocks.0/self_attn/Constant_57_attr::valueJ  &/blocks.0/self_attn/Concat_10_output_0 (/blocks.0/self_attn/Constant_57_output_0&/blocks.0/self_attn/Reshape_5_output_0/blocks.0/self_attn/Reshape_5"Reshape* allowzero t &/blocks.0/self_attn/Reshape_5_output_0%/blocks.0/self_attn/Shape_13_output_0/blocks.0/self_attn/Shape_13"Shape  %/blocks.0/self_attn/Shape_13_output_0./blocks.0/self_attn/ConstantOfShape_1_output_0%/blocks.0/self_attn/ConstantOfShape_1"ConstantOfShape*M value*AB1/blocks.0/self_attn/ConstantOfShape_1_attr::valueJ (/blocks.0/self_attn/Constant_58_output_0/blocks.0/self_attn/Constant_58"Constant*E value*9B+/blocks.0/self_attn/Constant_58_attr::valueJ  ./blocks.0/self_attn/ConstantOfShape_1_output_0 (/blocks.0/self_attn/Constant_58_output_0"/blocks.0/self_attn/Mul_6_output_0/blocks.0/self_attn/Mul_6"Mul  &/blocks.0/self_attn/Reshape_5_output_0 "/blocks.0/self_attn/Mul_6_output_0$/blocks.0/self_attn/Equal_1_output_0/blocks.0/self_attn/Equal_1"Equal  $/blocks.0/self_attn/Equal_1_output_0 ./blocks.0/self_attn/ConstantOfShape_1_output_0 &/blocks.0/self_attn/Reshape_5_output_0$/blocks.0/self_attn/Where_1_output_0/blocks.0/self_attn/Where_1"Where  )/blocks.0/self_attn/Unsqueeze_21_output_0 $/blocks.0/self_attn/Where_1_output_0%/blocks.0/self_attn/Expand_1_output_0/blocks.0/self_attn/Expand_1"Expand (/blocks.0/self_attn/Constant_59_output_0/blocks.0/self_attn/Constant_59"Constant*E value*9B+/blocks.0/self_attn/Constant_59_attr::valueJ  &/blocks.0/self_attn/Gather_13_output_0 (/blocks.0/self_attn/Constant_59_output_0"/blocks.0/self_attn/Mul_7_output_0/blocks.0/self_attn/Mul_7"Mul eonnx::Unsqueeze_584 Constant_2746"Constant*5 value*)BConstant_2746_attr::valueJ  &/blocks.0/self_attn/Gather_12_output_0 onnx::Unsqueeze_584)/blocks.0/self_attn/Unsqueeze_26_output_0 /blocks.0/self_attn/Unsqueeze_26" Unsqueeze eonnx::Unsqueeze_586 Constant_2748"Constant*5 value*)BConstant_2748_attr::valueJ  "/blocks.0/self_attn/Mul_7_output_0 onnx::Unsqueeze_586)/blocks.0/self_attn/Unsqueeze_27_output_0 /blocks.0/self_attn/Unsqueeze_27" Unsqueeze eonnx::Unsqueeze_588 Constant_2750"Constant*5 value*)BConstant_2750_attr::valueJ  &/blocks.0/self_attn/Gather_14_output_0 onnx::Unsqueeze_588)/blocks.0/self_attn/Unsqueeze_28_output_0 /blocks.0/self_attn/Unsqueeze_28" Unsqueeze eonnx::Unsqueeze_590 Constant_2752"Constant*5 value*)BConstant_2752_attr::valueJ  &/blocks.0/self_attn/Gather_15_output_0 onnx::Unsqueeze_590)/blocks.0/self_attn/Unsqueeze_29_output_0 /blocks.0/self_attn/Unsqueeze_29" Unsqueeze  )/blocks.0/self_attn/Unsqueeze_26_output_0 )/blocks.0/self_attn/Unsqueeze_27_output_0 )/blocks.0/self_attn/Unsqueeze_28_output_0 )/blocks.0/self_attn/Unsqueeze_29_output_0&/blocks.0/self_attn/Concat_11_output_0/blocks.0/self_attn/Concat_11"Concat* axis  %/blocks.0/self_attn/Expand_1_output_0 &/blocks.0/self_attn/Concat_11_output_0&/blocks.0/self_attn/Reshape_6_output_0/blocks.0/self_attn/Reshape_6"Reshape* allowzero  &/blocks.0/self_attn/Transpose_output_0 &/blocks.0/self_attn/Reshape_4_output_0#/blocks.0/self_attn/MatMul_output_0/blocks.0/self_attn/MatMul"MatMul (/blocks.0/self_attn/Constant_60_output_0/blocks.0/self_attn/Constant_60"Constant*A value*5B+/blocks.0/self_attn/Constant_60_attr::valueJ5A  #/blocks.0/self_attn/MatMul_output_0 (/blocks.0/self_attn/Constant_60_output_0"/blocks.0/self_attn/Div_2_output_0/blocks.0/self_attn/Div_2"Div x "/blocks.0/self_attn/Div_2_output_0 attention_mask"/blocks.0/self_attn/Add_2_output_0/blocks.0/self_attn/Add_2"Add  "/blocks.0/self_attn/Add_2_output_0$/blocks.0/self_attn/Softmax_output_0/blocks.0/self_attn/Softmax"Softmax* axis x $/blocks.0/self_attn/Softmax_output_0#/blocks.0/self_attn/Cast_4_output_0/blocks.0/self_attn/Cast_4"Cast* to  #/blocks.0/self_attn/Cast_4_output_0 &/blocks.0/self_attn/Reshape_6_output_0%/blocks.0/self_attn/MatMul_1_output_0/blocks.0/self_attn/MatMul_1"MatMul  %/blocks.0/self_attn/MatMul_1_output_0(/blocks.0/self_attn/Transpose_3_output_0/blocks.0/self_attn/Transpose_3" Transpose* perm@@@@ eonnx::Unsqueeze_602 Constant_2764"Constant*5 value*)BConstant_2764_attr::valueJ  #/blocks.0/self_attn/Gather_output_0 onnx::Unsqueeze_602)/blocks.0/self_attn/Unsqueeze_30_output_0 /blocks.0/self_attn/Unsqueeze_30" Unsqueeze eonnx::Unsqueeze_604 Constant_2766"Constant*5 value*)BConstant_2766_attr::valueJ  %/blocks.0/self_attn/Gather_1_output_0 onnx::Unsqueeze_604)/blocks.0/self_attn/Unsqueeze_31_output_0 /blocks.0/self_attn/Unsqueeze_31" Unsqueeze (/blocks.0/self_attn/Constant_61_output_0/blocks.0/self_attn/Constant_61"Constant*G value*;B+/blocks.0/self_attn/Constant_61_attr::valueJ  )/blocks.0/self_attn/Unsqueeze_30_output_0 )/blocks.0/self_attn/Unsqueeze_31_output_0 (/blocks.0/self_attn/Constant_61_output_0&/blocks.0/self_attn/Concat_12_output_0/blocks.0/self_attn/Concat_12"Concat* axis  (/blocks.0/self_attn/Transpose_3_output_0 &/blocks.0/self_attn/Concat_12_output_0&/blocks.0/self_attn/Reshape_7_output_0/blocks.0/self_attn/Reshape_7"Reshape* allowzero  &/blocks.0/self_attn/Reshape_7_output_0 onnx::MatMul_8589*/blocks.0/self_attn/o_proj/MatMul_output_0!/blocks.0/self_attn/o_proj/MatMul"MatMul  )/blocks.0/input_layernorm/Cast_1_output_0 */blocks.0/self_attn/o_proj/MatMul_output_0/blocks.0/Add_output_0 /blocks.0/Add"Add  /blocks.0/Add_output_00/blocks.0/post_attention_layernorm/Cast_output_0'/blocks.0/post_attention_layernorm/Cast"Cast* to 4/blocks.0/post_attention_layernorm/Constant_output_0+/blocks.0/post_attention_layernorm/Constant"Constant*M value*AB7/blocks.0/post_attention_layernorm/Constant_attr::valueJ@  0/blocks.0/post_attention_layernorm/Cast_output_0 4/blocks.0/post_attention_layernorm/Constant_output_0//blocks.0/post_attention_layernorm/Pow_output_0&/blocks.0/post_attention_layernorm/Pow"Pow  //blocks.0/post_attention_layernorm/Pow_output_06/blocks.0/post_attention_layernorm/ReduceMean_output_0-/blocks.0/post_attention_layernorm/ReduceMean" ReduceMean* axes@* keepdims 6/blocks.0/post_attention_layernorm/Constant_1_output_0-/blocks.0/post_attention_layernorm/Constant_1"Constant*O value*CB9/blocks.0/post_attention_layernorm/Constant_1_attr::valueJ75  6/blocks.0/post_attention_layernorm/ReduceMean_output_0 6/blocks.0/post_attention_layernorm/Constant_1_output_0//blocks.0/post_attention_layernorm/Add_output_0&/blocks.0/post_attention_layernorm/Add"Add  //blocks.0/post_attention_layernorm/Add_output_00/blocks.0/post_attention_layernorm/Sqrt_output_0'/blocks.0/post_attention_layernorm/Sqrt"Sqrt 6/blocks.0/post_attention_layernorm/Constant_2_output_0-/blocks.0/post_attention_layernorm/Constant_2"Constant*O value*CB9/blocks.0/post_attention_layernorm/Constant_2_attr::valueJ?  6/blocks.0/post_attention_layernorm/Constant_2_output_0 0/blocks.0/post_attention_layernorm/Sqrt_output_0//blocks.0/post_attention_layernorm/Div_output_0&/blocks.0/post_attention_layernorm/Div"Div  0/blocks.0/post_attention_layernorm/Cast_output_02/blocks.0/post_attention_layernorm/Cast_1_output_0)/blocks.0/post_attention_layernorm/Cast_1"Cast* to  2/blocks.0/post_attention_layernorm/Cast_1_output_0 //blocks.0/post_attention_layernorm/Div_output_0//blocks.0/post_attention_layernorm/Mul_output_0&/blocks.0/post_attention_layernorm/Mul"Mul  //blocks.0/post_attention_layernorm/Mul_output_0 (blocks.0.post_attention_layernorm.weight1/blocks.0/post_attention_layernorm/Mul_1_output_0(/blocks.0/post_attention_layernorm/Mul_1"Mul  1/blocks.0/post_attention_layernorm/Mul_1_output_02/blocks.0/post_attention_layernorm/Cast_2_output_0)/blocks.0/post_attention_layernorm/Cast_2"Cast* to  2/blocks.0/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_8590'/blocks.0/mlp/gate_proj/MatMul_output_0/blocks.0/mlp/gate_proj/MatMul"MatMul w '/blocks.0/mlp/gate_proj/MatMul_output_0%/blocks.0/mlp/act_fn/Sigmoid_output_0/blocks.0/mlp/act_fn/Sigmoid"Sigmoid  '/blocks.0/mlp/gate_proj/MatMul_output_0 %/blocks.0/mlp/act_fn/Sigmoid_output_0!/blocks.0/mlp/act_fn/Mul_output_0/blocks.0/mlp/act_fn/Mul"Mul  2/blocks.0/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_8591%/blocks.0/mlp/up_proj/MatMul_output_0/blocks.0/mlp/up_proj/MatMul"MatMul ~ !/blocks.0/mlp/act_fn/Mul_output_0 %/blocks.0/mlp/up_proj/MatMul_output_0/blocks.0/mlp/Mul_output_0/blocks.0/mlp/Mul"Mul  /blocks.0/mlp/Mul_output_0 onnx::MatMul_8592'/blocks.0/mlp/down_proj/MatMul_output_0/blocks.0/mlp/down_proj/MatMul"MatMul  2/blocks.0/post_attention_layernorm/Cast_1_output_0 '/blocks.0/mlp/down_proj/MatMul_output_0/blocks.0/Add_1_output_0/blocks.0/Add_1"Add b past_key_values /rotary/Constant_8_output_0/Gather_1_output_0 /Gather_1"Gather* axis /blocks.1/Constant_output_0/blocks.1/Constant"Constant*J value*>B/blocks.1/Constant_attr::valueJ  /blocks.0/Add_1_output_0 /blocks.1/Constant_output_0/blocks.1/Reshape_output_0/blocks.1/Reshape"Reshape* allowzero v /blocks.1/Reshape_output_0'/blocks.1/input_layernorm/Cast_output_0/blocks.1/input_layernorm/Cast"Cast* to +/blocks.1/input_layernorm/Constant_output_0"/blocks.1/input_layernorm/Constant"Constant*D value*8B./blocks.1/input_layernorm/Constant_attr::valueJ@  '/blocks.1/input_layernorm/Cast_output_0 +/blocks.1/input_layernorm/Constant_output_0&/blocks.1/input_layernorm/Pow_output_0/blocks.1/input_layernorm/Pow"Pow  &/blocks.1/input_layernorm/Pow_output_0-/blocks.1/input_layernorm/ReduceMean_output_0$/blocks.1/input_layernorm/ReduceMean" ReduceMean* axes@* keepdims -/blocks.1/input_layernorm/Constant_1_output_0$/blocks.1/input_layernorm/Constant_1"Constant*F value*:B0/blocks.1/input_layernorm/Constant_1_attr::valueJ75  -/blocks.1/input_layernorm/ReduceMean_output_0 -/blocks.1/input_layernorm/Constant_1_output_0&/blocks.1/input_layernorm/Add_output_0/blocks.1/input_layernorm/Add"Add w &/blocks.1/input_layernorm/Add_output_0'/blocks.1/input_layernorm/Sqrt_output_0/blocks.1/input_layernorm/Sqrt"Sqrt -/blocks.1/input_layernorm/Constant_2_output_0$/blocks.1/input_layernorm/Constant_2"Constant*F value*:B0/blocks.1/input_layernorm/Constant_2_attr::valueJ?  -/blocks.1/input_layernorm/Constant_2_output_0 '/blocks.1/input_layernorm/Sqrt_output_0&/blocks.1/input_layernorm/Div_output_0/blocks.1/input_layernorm/Div"Div  '/blocks.1/input_layernorm/Cast_output_0)/blocks.1/input_layernorm/Cast_1_output_0 /blocks.1/input_layernorm/Cast_1"Cast* to  )/blocks.1/input_layernorm/Cast_1_output_0 &/blocks.1/input_layernorm/Div_output_0&/blocks.1/input_layernorm/Mul_output_0/blocks.1/input_layernorm/Mul"Mul  &/blocks.1/input_layernorm/Mul_output_0 blocks.1.input_layernorm.weight(/blocks.1/input_layernorm/Mul_1_output_0/blocks.1/input_layernorm/Mul_1"Mul  (/blocks.1/input_layernorm/Mul_1_output_0)/blocks.1/input_layernorm/Cast_2_output_0 /blocks.1/input_layernorm/Cast_2"Cast* to q )/blocks.1/input_layernorm/Cast_2_output_0"/blocks.1/self_attn/Shape_output_0/blocks.1/self_attn/Shape"Shape %/blocks.1/self_attn/Constant_output_0/blocks.1/self_attn/Constant"Constant*B value*6B(/blocks.1/self_attn/Constant_attr::valueJ  "/blocks.1/self_attn/Shape_output_0 %/blocks.1/self_attn/Constant_output_0#/blocks.1/self_attn/Gather_output_0/blocks.1/self_attn/Gather"Gather* axis u )/blocks.1/input_layernorm/Cast_2_output_0$/blocks.1/self_attn/Shape_1_output_0/blocks.1/self_attn/Shape_1"Shape '/blocks.1/self_attn/Constant_1_output_0/blocks.1/self_attn/Constant_1"Constant*D value*8B*/blocks.1/self_attn/Constant_1_attr::valueJ  $/blocks.1/self_attn/Shape_1_output_0 '/blocks.1/self_attn/Constant_1_output_0%/blocks.1/self_attn/Gather_1_output_0/blocks.1/self_attn/Gather_1"Gather* axis  )/blocks.1/input_layernorm/Cast_2_output_0 onnx::MatMul_8593*/blocks.1/self_attn/q_proj/MatMul_output_0!/blocks.1/self_attn/q_proj/MatMul"MatMul  )/blocks.1/input_layernorm/Cast_2_output_0 onnx::MatMul_8594*/blocks.1/self_attn/k_proj/MatMul_output_0!/blocks.1/self_attn/k_proj/MatMul"MatMul  )/blocks.1/input_layernorm/Cast_2_output_0 onnx::MatMul_8595*/blocks.1/self_attn/v_proj/MatMul_output_0!/blocks.1/self_attn/v_proj/MatMul"MatMul eonnx::Unsqueeze_664 Constant_2818"Constant*5 value*)BConstant_2818_attr::valueJ  #/blocks.1/self_attn/Gather_output_0 onnx::Unsqueeze_664&/blocks.1/self_attn/Unsqueeze_output_0/blocks.1/self_attn/Unsqueeze" Unsqueeze eonnx::Unsqueeze_666 Constant_2820"Constant*5 value*)BConstant_2820_attr::valueJ  %/blocks.1/self_attn/Gather_1_output_0 onnx::Unsqueeze_666(/blocks.1/self_attn/Unsqueeze_1_output_0/blocks.1/self_attn/Unsqueeze_1" Unsqueeze '/blocks.1/self_attn/Constant_2_output_0/blocks.1/self_attn/Constant_2"Constant*F value*:B*/blocks.1/self_attn/Constant_2_attr::valueJ '/blocks.1/self_attn/Constant_3_output_0/blocks.1/self_attn/Constant_3"Constant*F value*:B*/blocks.1/self_attn/Constant_3_attr::valueJ  &/blocks.1/self_attn/Unsqueeze_output_0 (/blocks.1/self_attn/Unsqueeze_1_output_0 '/blocks.1/self_attn/Constant_2_output_0 '/blocks.1/self_attn/Constant_3_output_0#/blocks.1/self_attn/Concat_output_0/blocks.1/self_attn/Concat"Concat* axis  */blocks.1/self_attn/q_proj/MatMul_output_0 #/blocks.1/self_attn/Concat_output_0$/blocks.1/self_attn/Reshape_output_0/blocks.1/self_attn/Reshape"Reshape* allowzero eonnx::Unsqueeze_674 Constant_2826"Constant*5 value*)BConstant_2826_attr::valueJ  #/blocks.1/self_attn/Gather_output_0 onnx::Unsqueeze_674(/blocks.1/self_attn/Unsqueeze_2_output_0/blocks.1/self_attn/Unsqueeze_2" Unsqueeze eonnx::Unsqueeze_676 Constant_2828"Constant*5 value*)BConstant_2828_attr::valueJ  %/blocks.1/self_attn/Gather_1_output_0 onnx::Unsqueeze_676(/blocks.1/self_attn/Unsqueeze_3_output_0/blocks.1/self_attn/Unsqueeze_3" Unsqueeze '/blocks.1/self_attn/Constant_4_output_0/blocks.1/self_attn/Constant_4"Constant*F value*:B*/blocks.1/self_attn/Constant_4_attr::valueJ '/blocks.1/self_attn/Constant_5_output_0/blocks.1/self_attn/Constant_5"Constant*F value*:B*/blocks.1/self_attn/Constant_5_attr::valueJ  (/blocks.1/self_attn/Unsqueeze_2_output_0 (/blocks.1/self_attn/Unsqueeze_3_output_0 '/blocks.1/self_attn/Constant_4_output_0 '/blocks.1/self_attn/Constant_5_output_0%/blocks.1/self_attn/Concat_1_output_0/blocks.1/self_attn/Concat_1"Concat* axis eonnx::Unsqueeze_683 Constant_2833"Constant*5 value*)BConstant_2833_attr::valueJ  #/blocks.1/self_attn/Gather_output_0 onnx::Unsqueeze_683(/blocks.1/self_attn/Unsqueeze_4_output_0/blocks.1/self_attn/Unsqueeze_4" Unsqueeze eonnx::Unsqueeze_685 Constant_2835"Constant*5 value*)BConstant_2835_attr::valueJ  %/blocks.1/self_attn/Gather_1_output_0 onnx::Unsqueeze_685(/blocks.1/self_attn/Unsqueeze_5_output_0/blocks.1/self_attn/Unsqueeze_5" Unsqueeze '/blocks.1/self_attn/Constant_6_output_0/blocks.1/self_attn/Constant_6"Constant*F value*:B*/blocks.1/self_attn/Constant_6_attr::valueJ '/blocks.1/self_attn/Constant_7_output_0/blocks.1/self_attn/Constant_7"Constant*F value*:B*/blocks.1/self_attn/Constant_7_attr::valueJ  (/blocks.1/self_attn/Unsqueeze_4_output_0 (/blocks.1/self_attn/Unsqueeze_5_output_0 '/blocks.1/self_attn/Constant_6_output_0 '/blocks.1/self_attn/Constant_7_output_0%/blocks.1/self_attn/Concat_2_output_0/blocks.1/self_attn/Concat_2"Concat* axis  */blocks.1/self_attn/k_proj/MatMul_output_0 %/blocks.1/self_attn/Concat_1_output_0&/blocks.1/self_attn/Reshape_1_output_0/blocks.1/self_attn/Reshape_1"Reshape* allowzero  */blocks.1/self_attn/v_proj/MatMul_output_0 %/blocks.1/self_attn/Concat_2_output_0&/blocks.1/self_attn/Reshape_2_output_0/blocks.1/self_attn/Reshape_2"Reshape* allowzero  $/blocks.1/self_attn/Reshape_output_0(/blocks.1/self_attn/q_norm/Cast_output_0/blocks.1/self_attn/q_norm/Cast"Cast* to ,/blocks.1/self_attn/q_norm/Constant_output_0#/blocks.1/self_attn/q_norm/Constant"Constant*E value*9B//blocks.1/self_attn/q_norm/Constant_attr::valueJ@  (/blocks.1/self_attn/q_norm/Cast_output_0 ,/blocks.1/self_attn/q_norm/Constant_output_0'/blocks.1/self_attn/q_norm/Pow_output_0/blocks.1/self_attn/q_norm/Pow"Pow  '/blocks.1/self_attn/q_norm/Pow_output_0./blocks.1/self_attn/q_norm/ReduceMean_output_0%/blocks.1/self_attn/q_norm/ReduceMean" ReduceMean* axes@* keepdims ./blocks.1/self_attn/q_norm/Constant_1_output_0%/blocks.1/self_attn/q_norm/Constant_1"Constant*G value*;B1/blocks.1/self_attn/q_norm/Constant_1_attr::valueJ75  ./blocks.1/self_attn/q_norm/ReduceMean_output_0 ./blocks.1/self_attn/q_norm/Constant_1_output_0'/blocks.1/self_attn/q_norm/Add_output_0/blocks.1/self_attn/q_norm/Add"Add z '/blocks.1/self_attn/q_norm/Add_output_0(/blocks.1/self_attn/q_norm/Sqrt_output_0/blocks.1/self_attn/q_norm/Sqrt"Sqrt ./blocks.1/self_attn/q_norm/Constant_2_output_0%/blocks.1/self_attn/q_norm/Constant_2"Constant*G value*;B1/blocks.1/self_attn/q_norm/Constant_2_attr::valueJ?  ./blocks.1/self_attn/q_norm/Constant_2_output_0 (/blocks.1/self_attn/q_norm/Sqrt_output_0'/blocks.1/self_attn/q_norm/Div_output_0/blocks.1/self_attn/q_norm/Div"Div  (/blocks.1/self_attn/q_norm/Cast_output_0*/blocks.1/self_attn/q_norm/Cast_1_output_0!/blocks.1/self_attn/q_norm/Cast_1"Cast* to  */blocks.1/self_attn/q_norm/Cast_1_output_0 '/blocks.1/self_attn/q_norm/Div_output_0'/blocks.1/self_attn/q_norm/Mul_output_0/blocks.1/self_attn/q_norm/Mul"Mul  '/blocks.1/self_attn/q_norm/Mul_output_0 blocks.1.self_attn.q_norm.weight)/blocks.1/self_attn/q_norm/Mul_1_output_0 /blocks.1/self_attn/q_norm/Mul_1"Mul  )/blocks.1/self_attn/q_norm/Mul_1_output_0*/blocks.1/self_attn/q_norm/Cast_2_output_0!/blocks.1/self_attn/q_norm/Cast_2"Cast* to  &/blocks.1/self_attn/Reshape_1_output_0(/blocks.1/self_attn/k_norm/Cast_output_0/blocks.1/self_attn/k_norm/Cast"Cast* to ,/blocks.1/self_attn/k_norm/Constant_output_0#/blocks.1/self_attn/k_norm/Constant"Constant*E value*9B//blocks.1/self_attn/k_norm/Constant_attr::valueJ@  (/blocks.1/self_attn/k_norm/Cast_output_0 ,/blocks.1/self_attn/k_norm/Constant_output_0'/blocks.1/self_attn/k_norm/Pow_output_0/blocks.1/self_attn/k_norm/Pow"Pow  '/blocks.1/self_attn/k_norm/Pow_output_0./blocks.1/self_attn/k_norm/ReduceMean_output_0%/blocks.1/self_attn/k_norm/ReduceMean" ReduceMean* axes@* keepdims ./blocks.1/self_attn/k_norm/Constant_1_output_0%/blocks.1/self_attn/k_norm/Constant_1"Constant*G value*;B1/blocks.1/self_attn/k_norm/Constant_1_attr::valueJ75  ./blocks.1/self_attn/k_norm/ReduceMean_output_0 ./blocks.1/self_attn/k_norm/Constant_1_output_0'/blocks.1/self_attn/k_norm/Add_output_0/blocks.1/self_attn/k_norm/Add"Add z '/blocks.1/self_attn/k_norm/Add_output_0(/blocks.1/self_attn/k_norm/Sqrt_output_0/blocks.1/self_attn/k_norm/Sqrt"Sqrt ./blocks.1/self_attn/k_norm/Constant_2_output_0%/blocks.1/self_attn/k_norm/Constant_2"Constant*G value*;B1/blocks.1/self_attn/k_norm/Constant_2_attr::valueJ?  ./blocks.1/self_attn/k_norm/Constant_2_output_0 (/blocks.1/self_attn/k_norm/Sqrt_output_0'/blocks.1/self_attn/k_norm/Div_output_0/blocks.1/self_attn/k_norm/Div"Div  (/blocks.1/self_attn/k_norm/Cast_output_0*/blocks.1/self_attn/k_norm/Cast_1_output_0!/blocks.1/self_attn/k_norm/Cast_1"Cast* to  */blocks.1/self_attn/k_norm/Cast_1_output_0 '/blocks.1/self_attn/k_norm/Div_output_0'/blocks.1/self_attn/k_norm/Mul_output_0/blocks.1/self_attn/k_norm/Mul"Mul  '/blocks.1/self_attn/k_norm/Mul_output_0 blocks.1.self_attn.k_norm.weight)/blocks.1/self_attn/k_norm/Mul_1_output_0 /blocks.1/self_attn/k_norm/Mul_1"Mul  )/blocks.1/self_attn/k_norm/Mul_1_output_0*/blocks.1/self_attn/k_norm/Cast_2_output_0!/blocks.1/self_attn/k_norm/Cast_2"Cast* to  */blocks.1/self_attn/q_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0 /blocks.1/self_attn/Mul_output_0/blocks.1/self_attn/Mul"Mul v */blocks.1/self_attn/q_norm/Cast_2_output_0$/blocks.1/self_attn/Shape_2_output_0/blocks.1/self_attn/Shape_2"Shape '/blocks.1/self_attn/Constant_8_output_0/blocks.1/self_attn/Constant_8"Constant*D value*8B*/blocks.1/self_attn/Constant_8_attr::valueJ  $/blocks.1/self_attn/Shape_2_output_0 '/blocks.1/self_attn/Constant_8_output_0%/blocks.1/self_attn/Gather_2_output_0/blocks.1/self_attn/Gather_2"Gather* axis '/blocks.1/self_attn/Constant_9_output_0/blocks.1/self_attn/Constant_9"Constant*D value*8B*/blocks.1/self_attn/Constant_9_attr::valueJ  %/blocks.1/self_attn/Gather_2_output_0 '/blocks.1/self_attn/Constant_9_output_0 /blocks.1/self_attn/Div_output_0/blocks.1/self_attn/Div"Div p /blocks.1/self_attn/Div_output_0!/blocks.1/self_attn/Cast_output_0/blocks.1/self_attn/Cast"Cast* to u !/blocks.1/self_attn/Cast_output_0#/blocks.1/self_attn/Cast_1_output_0/blocks.1/self_attn/Cast_1"Cast* to (/blocks.1/self_attn/Constant_10_output_0/blocks.1/self_attn/Constant_10"Constant*G value*;B+/blocks.1/self_attn/Constant_10_attr::valueJ (/blocks.1/self_attn/Constant_11_output_0/blocks.1/self_attn/Constant_11"Constant*G value*;B+/blocks.1/self_attn/Constant_11_attr::valueJ (/blocks.1/self_attn/Constant_12_output_0/blocks.1/self_attn/Constant_12"Constant*G value*;B+/blocks.1/self_attn/Constant_12_attr::valueJ  #/blocks.1/self_attn/Cast_1_output_0 (/blocks.1/self_attn/Constant_12_output_0(/blocks.1/self_attn/Unsqueeze_6_output_0/blocks.1/self_attn/Unsqueeze_6" Unsqueeze (/blocks.1/self_attn/Constant_13_output_0/blocks.1/self_attn/Constant_13"Constant*G value*;B+/blocks.1/self_attn/Constant_13_attr::valueJ  */blocks.1/self_attn/q_norm/Cast_2_output_0 (/blocks.1/self_attn/Constant_11_output_0 (/blocks.1/self_attn/Unsqueeze_6_output_0 (/blocks.1/self_attn/Constant_10_output_0 (/blocks.1/self_attn/Constant_13_output_0"/blocks.1/self_attn/Slice_output_0/blocks.1/self_attn/Slice"Slice (/blocks.1/self_attn/Constant_14_output_0/blocks.1/self_attn/Constant_14"Constant*G value*;B+/blocks.1/self_attn/Constant_14_attr::valueJ (/blocks.1/self_attn/Constant_15_output_0/blocks.1/self_attn/Constant_15"Constant*G value*;B+/blocks.1/self_attn/Constant_15_attr::valueJ  #/blocks.1/self_attn/Cast_1_output_0 (/blocks.1/self_attn/Constant_15_output_0(/blocks.1/self_attn/Unsqueeze_7_output_0/blocks.1/self_attn/Unsqueeze_7" Unsqueeze (/blocks.1/self_attn/Constant_16_output_0/blocks.1/self_attn/Constant_16"Constant*G value*;B+/blocks.1/self_attn/Constant_16_attr::valueJ (/blocks.1/self_attn/Constant_17_output_0/blocks.1/self_attn/Constant_17"Constant*G value*;B+/blocks.1/self_attn/Constant_17_attr::valueJ  */blocks.1/self_attn/q_norm/Cast_2_output_0 (/blocks.1/self_attn/Unsqueeze_7_output_0 (/blocks.1/self_attn/Constant_16_output_0 (/blocks.1/self_attn/Constant_14_output_0 (/blocks.1/self_attn/Constant_17_output_0$/blocks.1/self_attn/Slice_1_output_0/blocks.1/self_attn/Slice_1"Slice f $/blocks.1/self_attn/Slice_1_output_0 /blocks.1/self_attn/Neg_output_0/blocks.1/self_attn/Neg"Neg  /blocks.1/self_attn/Neg_output_0 "/blocks.1/self_attn/Slice_output_0%/blocks.1/self_attn/Concat_3_output_0/blocks.1/self_attn/Concat_3"Concat* axis  %/blocks.1/self_attn/Concat_3_output_0 %/blocks.0/self_attn/Gather_3_output_0"/blocks.1/self_attn/Mul_1_output_0/blocks.1/self_attn/Mul_1"Mul  /blocks.1/self_attn/Mul_output_0 "/blocks.1/self_attn/Mul_1_output_0 /blocks.1/self_attn/Add_output_0/blocks.1/self_attn/Add"Add  */blocks.1/self_attn/k_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0"/blocks.1/self_attn/Mul_2_output_0/blocks.1/self_attn/Mul_2"Mul v */blocks.1/self_attn/k_norm/Cast_2_output_0$/blocks.1/self_attn/Shape_3_output_0/blocks.1/self_attn/Shape_3"Shape (/blocks.1/self_attn/Constant_18_output_0/blocks.1/self_attn/Constant_18"Constant*E value*9B+/blocks.1/self_attn/Constant_18_attr::valueJ  $/blocks.1/self_attn/Shape_3_output_0 (/blocks.1/self_attn/Constant_18_output_0%/blocks.1/self_attn/Gather_3_output_0/blocks.1/self_attn/Gather_3"Gather* axis (/blocks.1/self_attn/Constant_19_output_0/blocks.1/self_attn/Constant_19"Constant*E value*9B+/blocks.1/self_attn/Constant_19_attr::valueJ  %/blocks.1/self_attn/Gather_3_output_0 (/blocks.1/self_attn/Constant_19_output_0"/blocks.1/self_attn/Div_1_output_0/blocks.1/self_attn/Div_1"Div v "/blocks.1/self_attn/Div_1_output_0#/blocks.1/self_attn/Cast_2_output_0/blocks.1/self_attn/Cast_2"Cast* to w #/blocks.1/self_attn/Cast_2_output_0#/blocks.1/self_attn/Cast_3_output_0/blocks.1/self_attn/Cast_3"Cast* to (/blocks.1/self_attn/Constant_20_output_0/blocks.1/self_attn/Constant_20"Constant*G value*;B+/blocks.1/self_attn/Constant_20_attr::valueJ (/blocks.1/self_attn/Constant_21_output_0/blocks.1/self_attn/Constant_21"Constant*G value*;B+/blocks.1/self_attn/Constant_21_attr::valueJ (/blocks.1/self_attn/Constant_22_output_0/blocks.1/self_attn/Constant_22"Constant*G value*;B+/blocks.1/self_attn/Constant_22_attr::valueJ  #/blocks.1/self_attn/Cast_3_output_0 (/blocks.1/self_attn/Constant_22_output_0(/blocks.1/self_attn/Unsqueeze_8_output_0/blocks.1/self_attn/Unsqueeze_8" Unsqueeze (/blocks.1/self_attn/Constant_23_output_0/blocks.1/self_attn/Constant_23"Constant*G value*;B+/blocks.1/self_attn/Constant_23_attr::valueJ  */blocks.1/self_attn/k_norm/Cast_2_output_0 (/blocks.1/self_attn/Constant_21_output_0 (/blocks.1/self_attn/Unsqueeze_8_output_0 (/blocks.1/self_attn/Constant_20_output_0 (/blocks.1/self_attn/Constant_23_output_0$/blocks.1/self_attn/Slice_2_output_0/blocks.1/self_attn/Slice_2"Slice (/blocks.1/self_attn/Constant_24_output_0/blocks.1/self_attn/Constant_24"Constant*G value*;B+/blocks.1/self_attn/Constant_24_attr::valueJ (/blocks.1/self_attn/Constant_25_output_0/blocks.1/self_attn/Constant_25"Constant*G value*;B+/blocks.1/self_attn/Constant_25_attr::valueJ  #/blocks.1/self_attn/Cast_3_output_0 (/blocks.1/self_attn/Constant_25_output_0(/blocks.1/self_attn/Unsqueeze_9_output_0/blocks.1/self_attn/Unsqueeze_9" Unsqueeze (/blocks.1/self_attn/Constant_26_output_0/blocks.1/self_attn/Constant_26"Constant*G value*;B+/blocks.1/self_attn/Constant_26_attr::valueJ (/blocks.1/self_attn/Constant_27_output_0/blocks.1/self_attn/Constant_27"Constant*G value*;B+/blocks.1/self_attn/Constant_27_attr::valueJ  */blocks.1/self_attn/k_norm/Cast_2_output_0 (/blocks.1/self_attn/Unsqueeze_9_output_0 (/blocks.1/self_attn/Constant_26_output_0 (/blocks.1/self_attn/Constant_24_output_0 (/blocks.1/self_attn/Constant_27_output_0$/blocks.1/self_attn/Slice_3_output_0/blocks.1/self_attn/Slice_3"Slice j $/blocks.1/self_attn/Slice_3_output_0"/blocks.1/self_attn/Neg_1_output_0/blocks.1/self_attn/Neg_1"Neg  "/blocks.1/self_attn/Neg_1_output_0 $/blocks.1/self_attn/Slice_2_output_0%/blocks.1/self_attn/Concat_4_output_0/blocks.1/self_attn/Concat_4"Concat* axis  %/blocks.1/self_attn/Concat_4_output_0 %/blocks.0/self_attn/Gather_3_output_0"/blocks.1/self_attn/Mul_3_output_0/blocks.1/self_attn/Mul_3"Mul  "/blocks.1/self_attn/Mul_2_output_0 "/blocks.1/self_attn/Mul_3_output_0"/blocks.1/self_attn/Add_1_output_0/blocks.1/self_attn/Add_1"Add  /Gather_1_output_0 /rotary/Constant_3_output_0%/blocks.1/self_attn/Gather_4_output_0/blocks.1/self_attn/Gather_4"Gather* axis  /Gather_1_output_0 /rotary/Constant_8_output_0%/blocks.1/self_attn/Gather_5_output_0/blocks.1/self_attn/Gather_5"Gather* axis  %/blocks.1/self_attn/Gather_4_output_0 "/blocks.1/self_attn/Add_1_output_0%/blocks.1/self_attn/Concat_5_output_0/blocks.1/self_attn/Concat_5"Concat* axis  %/blocks.1/self_attn/Gather_5_output_0 &/blocks.1/self_attn/Reshape_2_output_0%/blocks.1/self_attn/Concat_6_output_0/blocks.1/self_attn/Concat_6"Concat* axis (/blocks.1/self_attn/Constant_28_output_0/blocks.1/self_attn/Constant_28"Constant*G value*;B+/blocks.1/self_attn/Constant_28_attr::valueJ  %/blocks.1/self_attn/Concat_5_output_0 (/blocks.1/self_attn/Constant_28_output_0)/blocks.1/self_attn/Unsqueeze_10_output_0 /blocks.1/self_attn/Unsqueeze_10" Unsqueeze (/blocks.1/self_attn/Constant_29_output_0/blocks.1/self_attn/Constant_29"Constant*G value*;B+/blocks.1/self_attn/Constant_29_attr::valueJ  %/blocks.1/self_attn/Concat_6_output_0 (/blocks.1/self_attn/Constant_29_output_0)/blocks.1/self_attn/Unsqueeze_11_output_0 /blocks.1/self_attn/Unsqueeze_11" Unsqueeze  )/blocks.1/self_attn/Unsqueeze_10_output_0 )/blocks.1/self_attn/Unsqueeze_11_output_0%/blocks.1/self_attn/Concat_7_output_0/blocks.1/self_attn/Concat_7"Concat* axis  /blocks.1/self_attn/Add_output_0&/blocks.1/self_attn/Transpose_output_0/blocks.1/self_attn/Transpose" Transpose* perm@@@@  %/blocks.1/self_attn/Concat_5_output_0(/blocks.1/self_attn/Transpose_1_output_0/blocks.1/self_attn/Transpose_1" Transpose* perm@@@@  %/blocks.1/self_attn/Concat_6_output_0(/blocks.1/self_attn/Transpose_2_output_0/blocks.1/self_attn/Transpose_2" Transpose* perm@@@@ t (/blocks.1/self_attn/Transpose_1_output_0$/blocks.1/self_attn/Shape_4_output_0/blocks.1/self_attn/Shape_4"Shape (/blocks.1/self_attn/Constant_30_output_0/blocks.1/self_attn/Constant_30"Constant*E value*9B+/blocks.1/self_attn/Constant_30_attr::valueJ  $/blocks.1/self_attn/Shape_4_output_0 (/blocks.1/self_attn/Constant_30_output_0%/blocks.1/self_attn/Gather_6_output_0/blocks.1/self_attn/Gather_6"Gather* axis t (/blocks.1/self_attn/Transpose_1_output_0$/blocks.1/self_attn/Shape_5_output_0/blocks.1/self_attn/Shape_5"Shape (/blocks.1/self_attn/Constant_31_output_0/blocks.1/self_attn/Constant_31"Constant*E value*9B+/blocks.1/self_attn/Constant_31_attr::valueJ  $/blocks.1/self_attn/Shape_5_output_0 (/blocks.1/self_attn/Constant_31_output_0%/blocks.1/self_attn/Gather_7_output_0/blocks.1/self_attn/Gather_7"Gather* axis t (/blocks.1/self_attn/Transpose_1_output_0$/blocks.1/self_attn/Shape_6_output_0/blocks.1/self_attn/Shape_6"Shape (/blocks.1/self_attn/Constant_32_output_0/blocks.1/self_attn/Constant_32"Constant*E value*9B+/blocks.1/self_attn/Constant_32_attr::valueJ  $/blocks.1/self_attn/Shape_6_output_0 (/blocks.1/self_attn/Constant_32_output_0%/blocks.1/self_attn/Gather_8_output_0/blocks.1/self_attn/Gather_8"Gather* axis t (/blocks.1/self_attn/Transpose_1_output_0$/blocks.1/self_attn/Shape_7_output_0/blocks.1/self_attn/Shape_7"Shape (/blocks.1/self_attn/Constant_33_output_0/blocks.1/self_attn/Constant_33"Constant*E value*9B+/blocks.1/self_attn/Constant_33_attr::valueJ  $/blocks.1/self_attn/Shape_7_output_0 (/blocks.1/self_attn/Constant_33_output_0%/blocks.1/self_attn/Gather_9_output_0/blocks.1/self_attn/Gather_9"Gather* axis (/blocks.1/self_attn/Constant_34_output_0/blocks.1/self_attn/Constant_34"Constant*G value*;B+/blocks.1/self_attn/Constant_34_attr::valueJ  (/blocks.1/self_attn/Transpose_1_output_0 (/blocks.1/self_attn/Constant_34_output_0)/blocks.1/self_attn/Unsqueeze_12_output_0 /blocks.1/self_attn/Unsqueeze_12" Unsqueeze (/blocks.1/self_attn/Constant_35_output_0/blocks.1/self_attn/Constant_35"Constant*G value*;B+/blocks.1/self_attn/Constant_35_attr::valueJ  %/blocks.1/self_attn/Gather_6_output_0 (/blocks.1/self_attn/Constant_35_output_0)/blocks.1/self_attn/Unsqueeze_13_output_0 /blocks.1/self_attn/Unsqueeze_13" Unsqueeze (/blocks.1/self_attn/Constant_36_output_0/blocks.1/self_attn/Constant_36"Constant*G value*;B+/blocks.1/self_attn/Constant_36_attr::valueJ  %/blocks.1/self_attn/Gather_7_output_0 (/blocks.1/self_attn/Constant_36_output_0)/blocks.1/self_attn/Unsqueeze_14_output_0 /blocks.1/self_attn/Unsqueeze_14" Unsqueeze (/blocks.1/self_attn/Constant_37_output_0/blocks.1/self_attn/Constant_37"Constant*G value*;B+/blocks.1/self_attn/Constant_37_attr::valueJ (/blocks.1/self_attn/Constant_38_output_0/blocks.1/self_attn/Constant_38"Constant*G value*;B+/blocks.1/self_attn/Constant_38_attr::valueJ  %/blocks.1/self_attn/Gather_8_output_0 (/blocks.1/self_attn/Constant_38_output_0)/blocks.1/self_attn/Unsqueeze_15_output_0 /blocks.1/self_attn/Unsqueeze_15" Unsqueeze (/blocks.1/self_attn/Constant_39_output_0/blocks.1/self_attn/Constant_39"Constant*G value*;B+/blocks.1/self_attn/Constant_39_attr::valueJ  %/blocks.1/self_attn/Gather_9_output_0 (/blocks.1/self_attn/Constant_39_output_0)/blocks.1/self_attn/Unsqueeze_16_output_0 /blocks.1/self_attn/Unsqueeze_16" Unsqueeze  )/blocks.1/self_attn/Unsqueeze_13_output_0 )/blocks.1/self_attn/Unsqueeze_14_output_0 (/blocks.1/self_attn/Constant_37_output_0 )/blocks.1/self_attn/Unsqueeze_15_output_0 )/blocks.1/self_attn/Unsqueeze_16_output_0%/blocks.1/self_attn/Concat_8_output_0/blocks.1/self_attn/Concat_8"Concat* axis (/blocks.1/self_attn/Constant_40_output_0/blocks.1/self_attn/Constant_40"Constant*G value*;B+/blocks.1/self_attn/Constant_40_attr::valueJ  %/blocks.1/self_attn/Concat_8_output_0 (/blocks.1/self_attn/Constant_40_output_0&/blocks.1/self_attn/Reshape_3_output_0/blocks.1/self_attn/Reshape_3"Reshape* allowzero r &/blocks.1/self_attn/Reshape_3_output_0$/blocks.1/self_attn/Shape_8_output_0/blocks.1/self_attn/Shape_8"Shape  $/blocks.1/self_attn/Shape_8_output_0,/blocks.1/self_attn/ConstantOfShape_output_0#/blocks.1/self_attn/ConstantOfShape"ConstantOfShape*K value*?B//blocks.1/self_attn/ConstantOfShape_attr::valueJ (/blocks.1/self_attn/Constant_41_output_0/blocks.1/self_attn/Constant_41"Constant*E value*9B+/blocks.1/self_attn/Constant_41_attr::valueJ  ,/blocks.1/self_attn/ConstantOfShape_output_0 (/blocks.1/self_attn/Constant_41_output_0"/blocks.1/self_attn/Mul_4_output_0/blocks.1/self_attn/Mul_4"Mul  &/blocks.1/self_attn/Reshape_3_output_0 "/blocks.1/self_attn/Mul_4_output_0"/blocks.1/self_attn/Equal_output_0/blocks.1/self_attn/Equal"Equal  "/blocks.1/self_attn/Equal_output_0 ,/blocks.1/self_attn/ConstantOfShape_output_0 &/blocks.1/self_attn/Reshape_3_output_0"/blocks.1/self_attn/Where_output_0/blocks.1/self_attn/Where"Where  )/blocks.1/self_attn/Unsqueeze_12_output_0 "/blocks.1/self_attn/Where_output_0#/blocks.1/self_attn/Expand_output_0/blocks.1/self_attn/Expand"Expand (/blocks.1/self_attn/Constant_42_output_0/blocks.1/self_attn/Constant_42"Constant*E value*9B+/blocks.1/self_attn/Constant_42_attr::valueJ  %/blocks.1/self_attn/Gather_7_output_0 (/blocks.1/self_attn/Constant_42_output_0"/blocks.1/self_attn/Mul_5_output_0/blocks.1/self_attn/Mul_5"Mul eonnx::Unsqueeze_828 Constant_2963"Constant*5 value*)BConstant_2963_attr::valueJ  %/blocks.1/self_attn/Gather_6_output_0 onnx::Unsqueeze_828)/blocks.1/self_attn/Unsqueeze_17_output_0 /blocks.1/self_attn/Unsqueeze_17" Unsqueeze eonnx::Unsqueeze_830 Constant_2965"Constant*5 value*)BConstant_2965_attr::valueJ  "/blocks.1/self_attn/Mul_5_output_0 onnx::Unsqueeze_830)/blocks.1/self_attn/Unsqueeze_18_output_0 /blocks.1/self_attn/Unsqueeze_18" Unsqueeze eonnx::Unsqueeze_832 Constant_2967"Constant*5 value*)BConstant_2967_attr::valueJ  %/blocks.1/self_attn/Gather_8_output_0 onnx::Unsqueeze_832)/blocks.1/self_attn/Unsqueeze_19_output_0 /blocks.1/self_attn/Unsqueeze_19" Unsqueeze eonnx::Unsqueeze_834 Constant_2969"Constant*5 value*)BConstant_2969_attr::valueJ  %/blocks.1/self_attn/Gather_9_output_0 onnx::Unsqueeze_834)/blocks.1/self_attn/Unsqueeze_20_output_0 /blocks.1/self_attn/Unsqueeze_20" Unsqueeze  )/blocks.1/self_attn/Unsqueeze_17_output_0 )/blocks.1/self_attn/Unsqueeze_18_output_0 )/blocks.1/self_attn/Unsqueeze_19_output_0 )/blocks.1/self_attn/Unsqueeze_20_output_0%/blocks.1/self_attn/Concat_9_output_0/blocks.1/self_attn/Concat_9"Concat* axis  #/blocks.1/self_attn/Expand_output_0 %/blocks.1/self_attn/Concat_9_output_0&/blocks.1/self_attn/Reshape_4_output_0/blocks.1/self_attn/Reshape_4"Reshape* allowzero t (/blocks.1/self_attn/Transpose_2_output_0$/blocks.1/self_attn/Shape_9_output_0/blocks.1/self_attn/Shape_9"Shape (/blocks.1/self_attn/Constant_43_output_0/blocks.1/self_attn/Constant_43"Constant*E value*9B+/blocks.1/self_attn/Constant_43_attr::valueJ  $/blocks.1/self_attn/Shape_9_output_0 (/blocks.1/self_attn/Constant_43_output_0&/blocks.1/self_attn/Gather_10_output_0/blocks.1/self_attn/Gather_10"Gather* axis v (/blocks.1/self_attn/Transpose_2_output_0%/blocks.1/self_attn/Shape_10_output_0/blocks.1/self_attn/Shape_10"Shape (/blocks.1/self_attn/Constant_44_output_0/blocks.1/self_attn/Constant_44"Constant*E value*9B+/blocks.1/self_attn/Constant_44_attr::valueJ  %/blocks.1/self_attn/Shape_10_output_0 (/blocks.1/self_attn/Constant_44_output_0&/blocks.1/self_attn/Gather_11_output_0/blocks.1/self_attn/Gather_11"Gather* axis v (/blocks.1/self_attn/Transpose_2_output_0%/blocks.1/self_attn/Shape_11_output_0/blocks.1/self_attn/Shape_11"Shape (/blocks.1/self_attn/Constant_45_output_0/blocks.1/self_attn/Constant_45"Constant*E value*9B+/blocks.1/self_attn/Constant_45_attr::valueJ  %/blocks.1/self_attn/Shape_11_output_0 (/blocks.1/self_attn/Constant_45_output_0&/blocks.1/self_attn/Gather_12_output_0/blocks.1/self_attn/Gather_12"Gather* axis v (/blocks.1/self_attn/Transpose_2_output_0%/blocks.1/self_attn/Shape_12_output_0/blocks.1/self_attn/Shape_12"Shape (/blocks.1/self_attn/Constant_46_output_0/blocks.1/self_attn/Constant_46"Constant*E value*9B+/blocks.1/self_attn/Constant_46_attr::valueJ  %/blocks.1/self_attn/Shape_12_output_0 (/blocks.1/self_attn/Constant_46_output_0&/blocks.1/self_attn/Gather_13_output_0/blocks.1/self_attn/Gather_13"Gather* axis (/blocks.1/self_attn/Constant_47_output_0/blocks.1/self_attn/Constant_47"Constant*G value*;B+/blocks.1/self_attn/Constant_47_attr::valueJ  (/blocks.1/self_attn/Transpose_2_output_0 (/blocks.1/self_attn/Constant_47_output_0)/blocks.1/self_attn/Unsqueeze_21_output_0 /blocks.1/self_attn/Unsqueeze_21" Unsqueeze (/blocks.1/self_attn/Constant_48_output_0/blocks.1/self_attn/Constant_48"Constant*G value*;B+/blocks.1/self_attn/Constant_48_attr::valueJ  &/blocks.1/self_attn/Gather_10_output_0 (/blocks.1/self_attn/Constant_48_output_0)/blocks.1/self_attn/Unsqueeze_22_output_0 /blocks.1/self_attn/Unsqueeze_22" Unsqueeze (/blocks.1/self_attn/Constant_49_output_0/blocks.1/self_attn/Constant_49"Constant*G value*;B+/blocks.1/self_attn/Constant_49_attr::valueJ  &/blocks.1/self_attn/Gather_11_output_0 (/blocks.1/self_attn/Constant_49_output_0)/blocks.1/self_attn/Unsqueeze_23_output_0 /blocks.1/self_attn/Unsqueeze_23" Unsqueeze (/blocks.1/self_attn/Constant_50_output_0/blocks.1/self_attn/Constant_50"Constant*G value*;B+/blocks.1/self_attn/Constant_50_attr::valueJ (/blocks.1/self_attn/Constant_51_output_0/blocks.1/self_attn/Constant_51"Constant*G value*;B+/blocks.1/self_attn/Constant_51_attr::valueJ  &/blocks.1/self_attn/Gather_12_output_0 (/blocks.1/self_attn/Constant_51_output_0)/blocks.1/self_attn/Unsqueeze_24_output_0 /blocks.1/self_attn/Unsqueeze_24" Unsqueeze (/blocks.1/self_attn/Constant_52_output_0/blocks.1/self_attn/Constant_52"Constant*G value*;B+/blocks.1/self_attn/Constant_52_attr::valueJ  &/blocks.1/self_attn/Gather_13_output_0 (/blocks.1/self_attn/Constant_52_output_0)/blocks.1/self_attn/Unsqueeze_25_output_0 /blocks.1/self_attn/Unsqueeze_25" Unsqueeze  )/blocks.1/self_attn/Unsqueeze_22_output_0 )/blocks.1/self_attn/Unsqueeze_23_output_0 (/blocks.1/self_attn/Constant_50_output_0 )/blocks.1/self_attn/Unsqueeze_24_output_0 )/blocks.1/self_attn/Unsqueeze_25_output_0&/blocks.1/self_attn/Concat_10_output_0/blocks.1/self_attn/Concat_10"Concat* axis (/blocks.1/self_attn/Constant_53_output_0/blocks.1/self_attn/Constant_53"Constant*G value*;B+/blocks.1/self_attn/Constant_53_attr::valueJ  &/blocks.1/self_attn/Concat_10_output_0 (/blocks.1/self_attn/Constant_53_output_0&/blocks.1/self_attn/Reshape_5_output_0/blocks.1/self_attn/Reshape_5"Reshape* allowzero t &/blocks.1/self_attn/Reshape_5_output_0%/blocks.1/self_attn/Shape_13_output_0/blocks.1/self_attn/Shape_13"Shape  %/blocks.1/self_attn/Shape_13_output_0./blocks.1/self_attn/ConstantOfShape_1_output_0%/blocks.1/self_attn/ConstantOfShape_1"ConstantOfShape*M value*AB1/blocks.1/self_attn/ConstantOfShape_1_attr::valueJ (/blocks.1/self_attn/Constant_54_output_0/blocks.1/self_attn/Constant_54"Constant*E value*9B+/blocks.1/self_attn/Constant_54_attr::valueJ  ./blocks.1/self_attn/ConstantOfShape_1_output_0 (/blocks.1/self_attn/Constant_54_output_0"/blocks.1/self_attn/Mul_6_output_0/blocks.1/self_attn/Mul_6"Mul  &/blocks.1/self_attn/Reshape_5_output_0 "/blocks.1/self_attn/Mul_6_output_0$/blocks.1/self_attn/Equal_1_output_0/blocks.1/self_attn/Equal_1"Equal  $/blocks.1/self_attn/Equal_1_output_0 ./blocks.1/self_attn/ConstantOfShape_1_output_0 &/blocks.1/self_attn/Reshape_5_output_0$/blocks.1/self_attn/Where_1_output_0/blocks.1/self_attn/Where_1"Where  )/blocks.1/self_attn/Unsqueeze_21_output_0 $/blocks.1/self_attn/Where_1_output_0%/blocks.1/self_attn/Expand_1_output_0/blocks.1/self_attn/Expand_1"Expand (/blocks.1/self_attn/Constant_55_output_0/blocks.1/self_attn/Constant_55"Constant*E value*9B+/blocks.1/self_attn/Constant_55_attr::valueJ  &/blocks.1/self_attn/Gather_11_output_0 (/blocks.1/self_attn/Constant_55_output_0"/blocks.1/self_attn/Mul_7_output_0/blocks.1/self_attn/Mul_7"Mul eonnx::Unsqueeze_874 Constant_3008"Constant*5 value*)BConstant_3008_attr::valueJ  &/blocks.1/self_attn/Gather_10_output_0 onnx::Unsqueeze_874)/blocks.1/self_attn/Unsqueeze_26_output_0 /blocks.1/self_attn/Unsqueeze_26" Unsqueeze eonnx::Unsqueeze_876 Constant_3010"Constant*5 value*)BConstant_3010_attr::valueJ  "/blocks.1/self_attn/Mul_7_output_0 onnx::Unsqueeze_876)/blocks.1/self_attn/Unsqueeze_27_output_0 /blocks.1/self_attn/Unsqueeze_27" Unsqueeze eonnx::Unsqueeze_878 Constant_3012"Constant*5 value*)BConstant_3012_attr::valueJ  &/blocks.1/self_attn/Gather_12_output_0 onnx::Unsqueeze_878)/blocks.1/self_attn/Unsqueeze_28_output_0 /blocks.1/self_attn/Unsqueeze_28" Unsqueeze eonnx::Unsqueeze_880 Constant_3014"Constant*5 value*)BConstant_3014_attr::valueJ  &/blocks.1/self_attn/Gather_13_output_0 onnx::Unsqueeze_880)/blocks.1/self_attn/Unsqueeze_29_output_0 /blocks.1/self_attn/Unsqueeze_29" Unsqueeze  )/blocks.1/self_attn/Unsqueeze_26_output_0 )/blocks.1/self_attn/Unsqueeze_27_output_0 )/blocks.1/self_attn/Unsqueeze_28_output_0 )/blocks.1/self_attn/Unsqueeze_29_output_0&/blocks.1/self_attn/Concat_11_output_0/blocks.1/self_attn/Concat_11"Concat* axis  %/blocks.1/self_attn/Expand_1_output_0 &/blocks.1/self_attn/Concat_11_output_0&/blocks.1/self_attn/Reshape_6_output_0/blocks.1/self_attn/Reshape_6"Reshape* allowzero  &/blocks.1/self_attn/Transpose_output_0 &/blocks.1/self_attn/Reshape_4_output_0#/blocks.1/self_attn/MatMul_output_0/blocks.1/self_attn/MatMul"MatMul (/blocks.1/self_attn/Constant_56_output_0/blocks.1/self_attn/Constant_56"Constant*A value*5B+/blocks.1/self_attn/Constant_56_attr::valueJ5A  #/blocks.1/self_attn/MatMul_output_0 (/blocks.1/self_attn/Constant_56_output_0"/blocks.1/self_attn/Div_2_output_0/blocks.1/self_attn/Div_2"Div x "/blocks.1/self_attn/Div_2_output_0 attention_mask"/blocks.1/self_attn/Add_2_output_0/blocks.1/self_attn/Add_2"Add  "/blocks.1/self_attn/Add_2_output_0$/blocks.1/self_attn/Softmax_output_0/blocks.1/self_attn/Softmax"Softmax* axis x $/blocks.1/self_attn/Softmax_output_0#/blocks.1/self_attn/Cast_4_output_0/blocks.1/self_attn/Cast_4"Cast* to  #/blocks.1/self_attn/Cast_4_output_0 &/blocks.1/self_attn/Reshape_6_output_0%/blocks.1/self_attn/MatMul_1_output_0/blocks.1/self_attn/MatMul_1"MatMul  %/blocks.1/self_attn/MatMul_1_output_0(/blocks.1/self_attn/Transpose_3_output_0/blocks.1/self_attn/Transpose_3" Transpose* perm@@@@ eonnx::Unsqueeze_892 Constant_3026"Constant*5 value*)BConstant_3026_attr::valueJ  #/blocks.1/self_attn/Gather_output_0 onnx::Unsqueeze_892)/blocks.1/self_attn/Unsqueeze_30_output_0 /blocks.1/self_attn/Unsqueeze_30" Unsqueeze eonnx::Unsqueeze_894 Constant_3028"Constant*5 value*)BConstant_3028_attr::valueJ  %/blocks.1/self_attn/Gather_1_output_0 onnx::Unsqueeze_894)/blocks.1/self_attn/Unsqueeze_31_output_0 /blocks.1/self_attn/Unsqueeze_31" Unsqueeze (/blocks.1/self_attn/Constant_57_output_0/blocks.1/self_attn/Constant_57"Constant*G value*;B+/blocks.1/self_attn/Constant_57_attr::valueJ  )/blocks.1/self_attn/Unsqueeze_30_output_0 )/blocks.1/self_attn/Unsqueeze_31_output_0 (/blocks.1/self_attn/Constant_57_output_0&/blocks.1/self_attn/Concat_12_output_0/blocks.1/self_attn/Concat_12"Concat* axis  (/blocks.1/self_attn/Transpose_3_output_0 &/blocks.1/self_attn/Concat_12_output_0&/blocks.1/self_attn/Reshape_7_output_0/blocks.1/self_attn/Reshape_7"Reshape* allowzero  &/blocks.1/self_attn/Reshape_7_output_0 onnx::MatMul_8617*/blocks.1/self_attn/o_proj/MatMul_output_0!/blocks.1/self_attn/o_proj/MatMul"MatMul  )/blocks.1/input_layernorm/Cast_1_output_0 */blocks.1/self_attn/o_proj/MatMul_output_0/blocks.1/Add_output_0 /blocks.1/Add"Add  /blocks.1/Add_output_00/blocks.1/post_attention_layernorm/Cast_output_0'/blocks.1/post_attention_layernorm/Cast"Cast* to 4/blocks.1/post_attention_layernorm/Constant_output_0+/blocks.1/post_attention_layernorm/Constant"Constant*M value*AB7/blocks.1/post_attention_layernorm/Constant_attr::valueJ@  0/blocks.1/post_attention_layernorm/Cast_output_0 4/blocks.1/post_attention_layernorm/Constant_output_0//blocks.1/post_attention_layernorm/Pow_output_0&/blocks.1/post_attention_layernorm/Pow"Pow  //blocks.1/post_attention_layernorm/Pow_output_06/blocks.1/post_attention_layernorm/ReduceMean_output_0-/blocks.1/post_attention_layernorm/ReduceMean" ReduceMean* axes@* keepdims 6/blocks.1/post_attention_layernorm/Constant_1_output_0-/blocks.1/post_attention_layernorm/Constant_1"Constant*O value*CB9/blocks.1/post_attention_layernorm/Constant_1_attr::valueJ75  6/blocks.1/post_attention_layernorm/ReduceMean_output_0 6/blocks.1/post_attention_layernorm/Constant_1_output_0//blocks.1/post_attention_layernorm/Add_output_0&/blocks.1/post_attention_layernorm/Add"Add  //blocks.1/post_attention_layernorm/Add_output_00/blocks.1/post_attention_layernorm/Sqrt_output_0'/blocks.1/post_attention_layernorm/Sqrt"Sqrt 6/blocks.1/post_attention_layernorm/Constant_2_output_0-/blocks.1/post_attention_layernorm/Constant_2"Constant*O value*CB9/blocks.1/post_attention_layernorm/Constant_2_attr::valueJ?  6/blocks.1/post_attention_layernorm/Constant_2_output_0 0/blocks.1/post_attention_layernorm/Sqrt_output_0//blocks.1/post_attention_layernorm/Div_output_0&/blocks.1/post_attention_layernorm/Div"Div  0/blocks.1/post_attention_layernorm/Cast_output_02/blocks.1/post_attention_layernorm/Cast_1_output_0)/blocks.1/post_attention_layernorm/Cast_1"Cast* to  2/blocks.1/post_attention_layernorm/Cast_1_output_0 //blocks.1/post_attention_layernorm/Div_output_0//blocks.1/post_attention_layernorm/Mul_output_0&/blocks.1/post_attention_layernorm/Mul"Mul  //blocks.1/post_attention_layernorm/Mul_output_0 (blocks.1.post_attention_layernorm.weight1/blocks.1/post_attention_layernorm/Mul_1_output_0(/blocks.1/post_attention_layernorm/Mul_1"Mul  1/blocks.1/post_attention_layernorm/Mul_1_output_02/blocks.1/post_attention_layernorm/Cast_2_output_0)/blocks.1/post_attention_layernorm/Cast_2"Cast* to  2/blocks.1/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_8618'/blocks.1/mlp/gate_proj/MatMul_output_0/blocks.1/mlp/gate_proj/MatMul"MatMul w '/blocks.1/mlp/gate_proj/MatMul_output_0%/blocks.1/mlp/act_fn/Sigmoid_output_0/blocks.1/mlp/act_fn/Sigmoid"Sigmoid  '/blocks.1/mlp/gate_proj/MatMul_output_0 %/blocks.1/mlp/act_fn/Sigmoid_output_0!/blocks.1/mlp/act_fn/Mul_output_0/blocks.1/mlp/act_fn/Mul"Mul  2/blocks.1/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_8619%/blocks.1/mlp/up_proj/MatMul_output_0/blocks.1/mlp/up_proj/MatMul"MatMul ~ !/blocks.1/mlp/act_fn/Mul_output_0 %/blocks.1/mlp/up_proj/MatMul_output_0/blocks.1/mlp/Mul_output_0/blocks.1/mlp/Mul"Mul  /blocks.1/mlp/Mul_output_0 onnx::MatMul_8620'/blocks.1/mlp/down_proj/MatMul_output_0/blocks.1/mlp/down_proj/MatMul"MatMul  2/blocks.1/post_attention_layernorm/Cast_1_output_0 '/blocks.1/mlp/down_proj/MatMul_output_0/blocks.1/Add_1_output_0/blocks.1/Add_1"Add b past_key_values /rotary/Constant_6_output_0/Gather_2_output_0 /Gather_2"Gather* axis /blocks.2/Constant_output_0/blocks.2/Constant"Constant*J value*>B/blocks.2/Constant_attr::valueJ  /blocks.1/Add_1_output_0 /blocks.2/Constant_output_0/blocks.2/Reshape_output_0/blocks.2/Reshape"Reshape* allowzero v /blocks.2/Reshape_output_0'/blocks.2/input_layernorm/Cast_output_0/blocks.2/input_layernorm/Cast"Cast* to +/blocks.2/input_layernorm/Constant_output_0"/blocks.2/input_layernorm/Constant"Constant*D value*8B./blocks.2/input_layernorm/Constant_attr::valueJ@  '/blocks.2/input_layernorm/Cast_output_0 +/blocks.2/input_layernorm/Constant_output_0&/blocks.2/input_layernorm/Pow_output_0/blocks.2/input_layernorm/Pow"Pow  &/blocks.2/input_layernorm/Pow_output_0-/blocks.2/input_layernorm/ReduceMean_output_0$/blocks.2/input_layernorm/ReduceMean" ReduceMean* axes@* keepdims -/blocks.2/input_layernorm/Constant_1_output_0$/blocks.2/input_layernorm/Constant_1"Constant*F value*:B0/blocks.2/input_layernorm/Constant_1_attr::valueJ75  -/blocks.2/input_layernorm/ReduceMean_output_0 -/blocks.2/input_layernorm/Constant_1_output_0&/blocks.2/input_layernorm/Add_output_0/blocks.2/input_layernorm/Add"Add w &/blocks.2/input_layernorm/Add_output_0'/blocks.2/input_layernorm/Sqrt_output_0/blocks.2/input_layernorm/Sqrt"Sqrt -/blocks.2/input_layernorm/Constant_2_output_0$/blocks.2/input_layernorm/Constant_2"Constant*F value*:B0/blocks.2/input_layernorm/Constant_2_attr::valueJ?  -/blocks.2/input_layernorm/Constant_2_output_0 '/blocks.2/input_layernorm/Sqrt_output_0&/blocks.2/input_layernorm/Div_output_0/blocks.2/input_layernorm/Div"Div  '/blocks.2/input_layernorm/Cast_output_0)/blocks.2/input_layernorm/Cast_1_output_0 /blocks.2/input_layernorm/Cast_1"Cast* to  )/blocks.2/input_layernorm/Cast_1_output_0 &/blocks.2/input_layernorm/Div_output_0&/blocks.2/input_layernorm/Mul_output_0/blocks.2/input_layernorm/Mul"Mul  &/blocks.2/input_layernorm/Mul_output_0 blocks.2.input_layernorm.weight(/blocks.2/input_layernorm/Mul_1_output_0/blocks.2/input_layernorm/Mul_1"Mul  (/blocks.2/input_layernorm/Mul_1_output_0)/blocks.2/input_layernorm/Cast_2_output_0 /blocks.2/input_layernorm/Cast_2"Cast* to q )/blocks.2/input_layernorm/Cast_2_output_0"/blocks.2/self_attn/Shape_output_0/blocks.2/self_attn/Shape"Shape %/blocks.2/self_attn/Constant_output_0/blocks.2/self_attn/Constant"Constant*B value*6B(/blocks.2/self_attn/Constant_attr::valueJ  "/blocks.2/self_attn/Shape_output_0 %/blocks.2/self_attn/Constant_output_0#/blocks.2/self_attn/Gather_output_0/blocks.2/self_attn/Gather"Gather* axis u )/blocks.2/input_layernorm/Cast_2_output_0$/blocks.2/self_attn/Shape_1_output_0/blocks.2/self_attn/Shape_1"Shape '/blocks.2/self_attn/Constant_1_output_0/blocks.2/self_attn/Constant_1"Constant*D value*8B*/blocks.2/self_attn/Constant_1_attr::valueJ  $/blocks.2/self_attn/Shape_1_output_0 '/blocks.2/self_attn/Constant_1_output_0%/blocks.2/self_attn/Gather_1_output_0/blocks.2/self_attn/Gather_1"Gather* axis  )/blocks.2/input_layernorm/Cast_2_output_0 onnx::MatMul_8621*/blocks.2/self_attn/q_proj/MatMul_output_0!/blocks.2/self_attn/q_proj/MatMul"MatMul  )/blocks.2/input_layernorm/Cast_2_output_0 onnx::MatMul_8622*/blocks.2/self_attn/k_proj/MatMul_output_0!/blocks.2/self_attn/k_proj/MatMul"MatMul  )/blocks.2/input_layernorm/Cast_2_output_0 onnx::MatMul_8623*/blocks.2/self_attn/v_proj/MatMul_output_0!/blocks.2/self_attn/v_proj/MatMul"MatMul eonnx::Unsqueeze_954 Constant_3080"Constant*5 value*)BConstant_3080_attr::valueJ  #/blocks.2/self_attn/Gather_output_0 onnx::Unsqueeze_954&/blocks.2/self_attn/Unsqueeze_output_0/blocks.2/self_attn/Unsqueeze" Unsqueeze eonnx::Unsqueeze_956 Constant_3082"Constant*5 value*)BConstant_3082_attr::valueJ  %/blocks.2/self_attn/Gather_1_output_0 onnx::Unsqueeze_956(/blocks.2/self_attn/Unsqueeze_1_output_0/blocks.2/self_attn/Unsqueeze_1" Unsqueeze '/blocks.2/self_attn/Constant_2_output_0/blocks.2/self_attn/Constant_2"Constant*F value*:B*/blocks.2/self_attn/Constant_2_attr::valueJ '/blocks.2/self_attn/Constant_3_output_0/blocks.2/self_attn/Constant_3"Constant*F value*:B*/blocks.2/self_attn/Constant_3_attr::valueJ  &/blocks.2/self_attn/Unsqueeze_output_0 (/blocks.2/self_attn/Unsqueeze_1_output_0 '/blocks.2/self_attn/Constant_2_output_0 '/blocks.2/self_attn/Constant_3_output_0#/blocks.2/self_attn/Concat_output_0/blocks.2/self_attn/Concat"Concat* axis  */blocks.2/self_attn/q_proj/MatMul_output_0 #/blocks.2/self_attn/Concat_output_0$/blocks.2/self_attn/Reshape_output_0/blocks.2/self_attn/Reshape"Reshape* allowzero eonnx::Unsqueeze_964 Constant_3088"Constant*5 value*)BConstant_3088_attr::valueJ  #/blocks.2/self_attn/Gather_output_0 onnx::Unsqueeze_964(/blocks.2/self_attn/Unsqueeze_2_output_0/blocks.2/self_attn/Unsqueeze_2" Unsqueeze eonnx::Unsqueeze_966 Constant_3090"Constant*5 value*)BConstant_3090_attr::valueJ  %/blocks.2/self_attn/Gather_1_output_0 onnx::Unsqueeze_966(/blocks.2/self_attn/Unsqueeze_3_output_0/blocks.2/self_attn/Unsqueeze_3" Unsqueeze '/blocks.2/self_attn/Constant_4_output_0/blocks.2/self_attn/Constant_4"Constant*F value*:B*/blocks.2/self_attn/Constant_4_attr::valueJ '/blocks.2/self_attn/Constant_5_output_0/blocks.2/self_attn/Constant_5"Constant*F value*:B*/blocks.2/self_attn/Constant_5_attr::valueJ  (/blocks.2/self_attn/Unsqueeze_2_output_0 (/blocks.2/self_attn/Unsqueeze_3_output_0 '/blocks.2/self_attn/Constant_4_output_0 '/blocks.2/self_attn/Constant_5_output_0%/blocks.2/self_attn/Concat_1_output_0/blocks.2/self_attn/Concat_1"Concat* axis eonnx::Unsqueeze_973 Constant_3095"Constant*5 value*)BConstant_3095_attr::valueJ  #/blocks.2/self_attn/Gather_output_0 onnx::Unsqueeze_973(/blocks.2/self_attn/Unsqueeze_4_output_0/blocks.2/self_attn/Unsqueeze_4" Unsqueeze eonnx::Unsqueeze_975 Constant_3097"Constant*5 value*)BConstant_3097_attr::valueJ  %/blocks.2/self_attn/Gather_1_output_0 onnx::Unsqueeze_975(/blocks.2/self_attn/Unsqueeze_5_output_0/blocks.2/self_attn/Unsqueeze_5" Unsqueeze '/blocks.2/self_attn/Constant_6_output_0/blocks.2/self_attn/Constant_6"Constant*F value*:B*/blocks.2/self_attn/Constant_6_attr::valueJ '/blocks.2/self_attn/Constant_7_output_0/blocks.2/self_attn/Constant_7"Constant*F value*:B*/blocks.2/self_attn/Constant_7_attr::valueJ  (/blocks.2/self_attn/Unsqueeze_4_output_0 (/blocks.2/self_attn/Unsqueeze_5_output_0 '/blocks.2/self_attn/Constant_6_output_0 '/blocks.2/self_attn/Constant_7_output_0%/blocks.2/self_attn/Concat_2_output_0/blocks.2/self_attn/Concat_2"Concat* axis  */blocks.2/self_attn/k_proj/MatMul_output_0 %/blocks.2/self_attn/Concat_1_output_0&/blocks.2/self_attn/Reshape_1_output_0/blocks.2/self_attn/Reshape_1"Reshape* allowzero  */blocks.2/self_attn/v_proj/MatMul_output_0 %/blocks.2/self_attn/Concat_2_output_0&/blocks.2/self_attn/Reshape_2_output_0/blocks.2/self_attn/Reshape_2"Reshape* allowzero  $/blocks.2/self_attn/Reshape_output_0(/blocks.2/self_attn/q_norm/Cast_output_0/blocks.2/self_attn/q_norm/Cast"Cast* to ,/blocks.2/self_attn/q_norm/Constant_output_0#/blocks.2/self_attn/q_norm/Constant"Constant*E value*9B//blocks.2/self_attn/q_norm/Constant_attr::valueJ@  (/blocks.2/self_attn/q_norm/Cast_output_0 ,/blocks.2/self_attn/q_norm/Constant_output_0'/blocks.2/self_attn/q_norm/Pow_output_0/blocks.2/self_attn/q_norm/Pow"Pow  '/blocks.2/self_attn/q_norm/Pow_output_0./blocks.2/self_attn/q_norm/ReduceMean_output_0%/blocks.2/self_attn/q_norm/ReduceMean" ReduceMean* axes@* keepdims ./blocks.2/self_attn/q_norm/Constant_1_output_0%/blocks.2/self_attn/q_norm/Constant_1"Constant*G value*;B1/blocks.2/self_attn/q_norm/Constant_1_attr::valueJ75  ./blocks.2/self_attn/q_norm/ReduceMean_output_0 ./blocks.2/self_attn/q_norm/Constant_1_output_0'/blocks.2/self_attn/q_norm/Add_output_0/blocks.2/self_attn/q_norm/Add"Add z '/blocks.2/self_attn/q_norm/Add_output_0(/blocks.2/self_attn/q_norm/Sqrt_output_0/blocks.2/self_attn/q_norm/Sqrt"Sqrt ./blocks.2/self_attn/q_norm/Constant_2_output_0%/blocks.2/self_attn/q_norm/Constant_2"Constant*G value*;B1/blocks.2/self_attn/q_norm/Constant_2_attr::valueJ?  ./blocks.2/self_attn/q_norm/Constant_2_output_0 (/blocks.2/self_attn/q_norm/Sqrt_output_0'/blocks.2/self_attn/q_norm/Div_output_0/blocks.2/self_attn/q_norm/Div"Div  (/blocks.2/self_attn/q_norm/Cast_output_0*/blocks.2/self_attn/q_norm/Cast_1_output_0!/blocks.2/self_attn/q_norm/Cast_1"Cast* to  */blocks.2/self_attn/q_norm/Cast_1_output_0 '/blocks.2/self_attn/q_norm/Div_output_0'/blocks.2/self_attn/q_norm/Mul_output_0/blocks.2/self_attn/q_norm/Mul"Mul  '/blocks.2/self_attn/q_norm/Mul_output_0 blocks.2.self_attn.q_norm.weight)/blocks.2/self_attn/q_norm/Mul_1_output_0 /blocks.2/self_attn/q_norm/Mul_1"Mul  )/blocks.2/self_attn/q_norm/Mul_1_output_0*/blocks.2/self_attn/q_norm/Cast_2_output_0!/blocks.2/self_attn/q_norm/Cast_2"Cast* to  &/blocks.2/self_attn/Reshape_1_output_0(/blocks.2/self_attn/k_norm/Cast_output_0/blocks.2/self_attn/k_norm/Cast"Cast* to ,/blocks.2/self_attn/k_norm/Constant_output_0#/blocks.2/self_attn/k_norm/Constant"Constant*E value*9B//blocks.2/self_attn/k_norm/Constant_attr::valueJ@  (/blocks.2/self_attn/k_norm/Cast_output_0 ,/blocks.2/self_attn/k_norm/Constant_output_0'/blocks.2/self_attn/k_norm/Pow_output_0/blocks.2/self_attn/k_norm/Pow"Pow  '/blocks.2/self_attn/k_norm/Pow_output_0./blocks.2/self_attn/k_norm/ReduceMean_output_0%/blocks.2/self_attn/k_norm/ReduceMean" ReduceMean* axes@* keepdims ./blocks.2/self_attn/k_norm/Constant_1_output_0%/blocks.2/self_attn/k_norm/Constant_1"Constant*G value*;B1/blocks.2/self_attn/k_norm/Constant_1_attr::valueJ75  ./blocks.2/self_attn/k_norm/ReduceMean_output_0 ./blocks.2/self_attn/k_norm/Constant_1_output_0'/blocks.2/self_attn/k_norm/Add_output_0/blocks.2/self_attn/k_norm/Add"Add z '/blocks.2/self_attn/k_norm/Add_output_0(/blocks.2/self_attn/k_norm/Sqrt_output_0/blocks.2/self_attn/k_norm/Sqrt"Sqrt ./blocks.2/self_attn/k_norm/Constant_2_output_0%/blocks.2/self_attn/k_norm/Constant_2"Constant*G value*;B1/blocks.2/self_attn/k_norm/Constant_2_attr::valueJ?  ./blocks.2/self_attn/k_norm/Constant_2_output_0 (/blocks.2/self_attn/k_norm/Sqrt_output_0'/blocks.2/self_attn/k_norm/Div_output_0/blocks.2/self_attn/k_norm/Div"Div  (/blocks.2/self_attn/k_norm/Cast_output_0*/blocks.2/self_attn/k_norm/Cast_1_output_0!/blocks.2/self_attn/k_norm/Cast_1"Cast* to  */blocks.2/self_attn/k_norm/Cast_1_output_0 '/blocks.2/self_attn/k_norm/Div_output_0'/blocks.2/self_attn/k_norm/Mul_output_0/blocks.2/self_attn/k_norm/Mul"Mul  '/blocks.2/self_attn/k_norm/Mul_output_0 blocks.2.self_attn.k_norm.weight)/blocks.2/self_attn/k_norm/Mul_1_output_0 /blocks.2/self_attn/k_norm/Mul_1"Mul  )/blocks.2/self_attn/k_norm/Mul_1_output_0*/blocks.2/self_attn/k_norm/Cast_2_output_0!/blocks.2/self_attn/k_norm/Cast_2"Cast* to  */blocks.2/self_attn/q_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0 /blocks.2/self_attn/Mul_output_0/blocks.2/self_attn/Mul"Mul v */blocks.2/self_attn/q_norm/Cast_2_output_0$/blocks.2/self_attn/Shape_2_output_0/blocks.2/self_attn/Shape_2"Shape '/blocks.2/self_attn/Constant_8_output_0/blocks.2/self_attn/Constant_8"Constant*D value*8B*/blocks.2/self_attn/Constant_8_attr::valueJ  $/blocks.2/self_attn/Shape_2_output_0 '/blocks.2/self_attn/Constant_8_output_0%/blocks.2/self_attn/Gather_2_output_0/blocks.2/self_attn/Gather_2"Gather* axis '/blocks.2/self_attn/Constant_9_output_0/blocks.2/self_attn/Constant_9"Constant*D value*8B*/blocks.2/self_attn/Constant_9_attr::valueJ  %/blocks.2/self_attn/Gather_2_output_0 '/blocks.2/self_attn/Constant_9_output_0 /blocks.2/self_attn/Div_output_0/blocks.2/self_attn/Div"Div p /blocks.2/self_attn/Div_output_0!/blocks.2/self_attn/Cast_output_0/blocks.2/self_attn/Cast"Cast* to u !/blocks.2/self_attn/Cast_output_0#/blocks.2/self_attn/Cast_1_output_0/blocks.2/self_attn/Cast_1"Cast* to (/blocks.2/self_attn/Constant_10_output_0/blocks.2/self_attn/Constant_10"Constant*G value*;B+/blocks.2/self_attn/Constant_10_attr::valueJ (/blocks.2/self_attn/Constant_11_output_0/blocks.2/self_attn/Constant_11"Constant*G value*;B+/blocks.2/self_attn/Constant_11_attr::valueJ (/blocks.2/self_attn/Constant_12_output_0/blocks.2/self_attn/Constant_12"Constant*G value*;B+/blocks.2/self_attn/Constant_12_attr::valueJ  #/blocks.2/self_attn/Cast_1_output_0 (/blocks.2/self_attn/Constant_12_output_0(/blocks.2/self_attn/Unsqueeze_6_output_0/blocks.2/self_attn/Unsqueeze_6" Unsqueeze (/blocks.2/self_attn/Constant_13_output_0/blocks.2/self_attn/Constant_13"Constant*G value*;B+/blocks.2/self_attn/Constant_13_attr::valueJ  */blocks.2/self_attn/q_norm/Cast_2_output_0 (/blocks.2/self_attn/Constant_11_output_0 (/blocks.2/self_attn/Unsqueeze_6_output_0 (/blocks.2/self_attn/Constant_10_output_0 (/blocks.2/self_attn/Constant_13_output_0"/blocks.2/self_attn/Slice_output_0/blocks.2/self_attn/Slice"Slice (/blocks.2/self_attn/Constant_14_output_0/blocks.2/self_attn/Constant_14"Constant*G value*;B+/blocks.2/self_attn/Constant_14_attr::valueJ (/blocks.2/self_attn/Constant_15_output_0/blocks.2/self_attn/Constant_15"Constant*G value*;B+/blocks.2/self_attn/Constant_15_attr::valueJ  #/blocks.2/self_attn/Cast_1_output_0 (/blocks.2/self_attn/Constant_15_output_0(/blocks.2/self_attn/Unsqueeze_7_output_0/blocks.2/self_attn/Unsqueeze_7" Unsqueeze (/blocks.2/self_attn/Constant_16_output_0/blocks.2/self_attn/Constant_16"Constant*G value*;B+/blocks.2/self_attn/Constant_16_attr::valueJ (/blocks.2/self_attn/Constant_17_output_0/blocks.2/self_attn/Constant_17"Constant*G value*;B+/blocks.2/self_attn/Constant_17_attr::valueJ  */blocks.2/self_attn/q_norm/Cast_2_output_0 (/blocks.2/self_attn/Unsqueeze_7_output_0 (/blocks.2/self_attn/Constant_16_output_0 (/blocks.2/self_attn/Constant_14_output_0 (/blocks.2/self_attn/Constant_17_output_0$/blocks.2/self_attn/Slice_1_output_0/blocks.2/self_attn/Slice_1"Slice f $/blocks.2/self_attn/Slice_1_output_0 /blocks.2/self_attn/Neg_output_0/blocks.2/self_attn/Neg"Neg  /blocks.2/self_attn/Neg_output_0 "/blocks.2/self_attn/Slice_output_0%/blocks.2/self_attn/Concat_3_output_0/blocks.2/self_attn/Concat_3"Concat* axis  %/blocks.2/self_attn/Concat_3_output_0 %/blocks.0/self_attn/Gather_3_output_0"/blocks.2/self_attn/Mul_1_output_0/blocks.2/self_attn/Mul_1"Mul  /blocks.2/self_attn/Mul_output_0 "/blocks.2/self_attn/Mul_1_output_0 /blocks.2/self_attn/Add_output_0/blocks.2/self_attn/Add"Add  */blocks.2/self_attn/k_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0"/blocks.2/self_attn/Mul_2_output_0/blocks.2/self_attn/Mul_2"Mul v */blocks.2/self_attn/k_norm/Cast_2_output_0$/blocks.2/self_attn/Shape_3_output_0/blocks.2/self_attn/Shape_3"Shape (/blocks.2/self_attn/Constant_18_output_0/blocks.2/self_attn/Constant_18"Constant*E value*9B+/blocks.2/self_attn/Constant_18_attr::valueJ  $/blocks.2/self_attn/Shape_3_output_0 (/blocks.2/self_attn/Constant_18_output_0%/blocks.2/self_attn/Gather_3_output_0/blocks.2/self_attn/Gather_3"Gather* axis (/blocks.2/self_attn/Constant_19_output_0/blocks.2/self_attn/Constant_19"Constant*E value*9B+/blocks.2/self_attn/Constant_19_attr::valueJ  %/blocks.2/self_attn/Gather_3_output_0 (/blocks.2/self_attn/Constant_19_output_0"/blocks.2/self_attn/Div_1_output_0/blocks.2/self_attn/Div_1"Div v "/blocks.2/self_attn/Div_1_output_0#/blocks.2/self_attn/Cast_2_output_0/blocks.2/self_attn/Cast_2"Cast* to w #/blocks.2/self_attn/Cast_2_output_0#/blocks.2/self_attn/Cast_3_output_0/blocks.2/self_attn/Cast_3"Cast* to (/blocks.2/self_attn/Constant_20_output_0/blocks.2/self_attn/Constant_20"Constant*G value*;B+/blocks.2/self_attn/Constant_20_attr::valueJ (/blocks.2/self_attn/Constant_21_output_0/blocks.2/self_attn/Constant_21"Constant*G value*;B+/blocks.2/self_attn/Constant_21_attr::valueJ (/blocks.2/self_attn/Constant_22_output_0/blocks.2/self_attn/Constant_22"Constant*G value*;B+/blocks.2/self_attn/Constant_22_attr::valueJ  #/blocks.2/self_attn/Cast_3_output_0 (/blocks.2/self_attn/Constant_22_output_0(/blocks.2/self_attn/Unsqueeze_8_output_0/blocks.2/self_attn/Unsqueeze_8" Unsqueeze (/blocks.2/self_attn/Constant_23_output_0/blocks.2/self_attn/Constant_23"Constant*G value*;B+/blocks.2/self_attn/Constant_23_attr::valueJ  */blocks.2/self_attn/k_norm/Cast_2_output_0 (/blocks.2/self_attn/Constant_21_output_0 (/blocks.2/self_attn/Unsqueeze_8_output_0 (/blocks.2/self_attn/Constant_20_output_0 (/blocks.2/self_attn/Constant_23_output_0$/blocks.2/self_attn/Slice_2_output_0/blocks.2/self_attn/Slice_2"Slice (/blocks.2/self_attn/Constant_24_output_0/blocks.2/self_attn/Constant_24"Constant*G value*;B+/blocks.2/self_attn/Constant_24_attr::valueJ (/blocks.2/self_attn/Constant_25_output_0/blocks.2/self_attn/Constant_25"Constant*G value*;B+/blocks.2/self_attn/Constant_25_attr::valueJ  #/blocks.2/self_attn/Cast_3_output_0 (/blocks.2/self_attn/Constant_25_output_0(/blocks.2/self_attn/Unsqueeze_9_output_0/blocks.2/self_attn/Unsqueeze_9" Unsqueeze (/blocks.2/self_attn/Constant_26_output_0/blocks.2/self_attn/Constant_26"Constant*G value*;B+/blocks.2/self_attn/Constant_26_attr::valueJ (/blocks.2/self_attn/Constant_27_output_0/blocks.2/self_attn/Constant_27"Constant*G value*;B+/blocks.2/self_attn/Constant_27_attr::valueJ  */blocks.2/self_attn/k_norm/Cast_2_output_0 (/blocks.2/self_attn/Unsqueeze_9_output_0 (/blocks.2/self_attn/Constant_26_output_0 (/blocks.2/self_attn/Constant_24_output_0 (/blocks.2/self_attn/Constant_27_output_0$/blocks.2/self_attn/Slice_3_output_0/blocks.2/self_attn/Slice_3"Slice j $/blocks.2/self_attn/Slice_3_output_0"/blocks.2/self_attn/Neg_1_output_0/blocks.2/self_attn/Neg_1"Neg  "/blocks.2/self_attn/Neg_1_output_0 $/blocks.2/self_attn/Slice_2_output_0%/blocks.2/self_attn/Concat_4_output_0/blocks.2/self_attn/Concat_4"Concat* axis  %/blocks.2/self_attn/Concat_4_output_0 %/blocks.0/self_attn/Gather_3_output_0"/blocks.2/self_attn/Mul_3_output_0/blocks.2/self_attn/Mul_3"Mul  "/blocks.2/self_attn/Mul_2_output_0 "/blocks.2/self_attn/Mul_3_output_0"/blocks.2/self_attn/Add_1_output_0/blocks.2/self_attn/Add_1"Add  /Gather_2_output_0 /rotary/Constant_3_output_0%/blocks.2/self_attn/Gather_4_output_0/blocks.2/self_attn/Gather_4"Gather* axis  /Gather_2_output_0 /rotary/Constant_8_output_0%/blocks.2/self_attn/Gather_5_output_0/blocks.2/self_attn/Gather_5"Gather* axis  %/blocks.2/self_attn/Gather_4_output_0 "/blocks.2/self_attn/Add_1_output_0%/blocks.2/self_attn/Concat_5_output_0/blocks.2/self_attn/Concat_5"Concat* axis  %/blocks.2/self_attn/Gather_5_output_0 &/blocks.2/self_attn/Reshape_2_output_0%/blocks.2/self_attn/Concat_6_output_0/blocks.2/self_attn/Concat_6"Concat* axis (/blocks.2/self_attn/Constant_28_output_0/blocks.2/self_attn/Constant_28"Constant*G value*;B+/blocks.2/self_attn/Constant_28_attr::valueJ  %/blocks.2/self_attn/Concat_5_output_0 (/blocks.2/self_attn/Constant_28_output_0)/blocks.2/self_attn/Unsqueeze_10_output_0 /blocks.2/self_attn/Unsqueeze_10" Unsqueeze (/blocks.2/self_attn/Constant_29_output_0/blocks.2/self_attn/Constant_29"Constant*G value*;B+/blocks.2/self_attn/Constant_29_attr::valueJ  %/blocks.2/self_attn/Concat_6_output_0 (/blocks.2/self_attn/Constant_29_output_0)/blocks.2/self_attn/Unsqueeze_11_output_0 /blocks.2/self_attn/Unsqueeze_11" Unsqueeze  )/blocks.2/self_attn/Unsqueeze_10_output_0 )/blocks.2/self_attn/Unsqueeze_11_output_0%/blocks.2/self_attn/Concat_7_output_0/blocks.2/self_attn/Concat_7"Concat* axis  /blocks.2/self_attn/Add_output_0&/blocks.2/self_attn/Transpose_output_0/blocks.2/self_attn/Transpose" Transpose* perm@@@@  %/blocks.2/self_attn/Concat_5_output_0(/blocks.2/self_attn/Transpose_1_output_0/blocks.2/self_attn/Transpose_1" Transpose* perm@@@@  %/blocks.2/self_attn/Concat_6_output_0(/blocks.2/self_attn/Transpose_2_output_0/blocks.2/self_attn/Transpose_2" Transpose* perm@@@@ t (/blocks.2/self_attn/Transpose_1_output_0$/blocks.2/self_attn/Shape_4_output_0/blocks.2/self_attn/Shape_4"Shape (/blocks.2/self_attn/Constant_30_output_0/blocks.2/self_attn/Constant_30"Constant*E value*9B+/blocks.2/self_attn/Constant_30_attr::valueJ  $/blocks.2/self_attn/Shape_4_output_0 (/blocks.2/self_attn/Constant_30_output_0%/blocks.2/self_attn/Gather_6_output_0/blocks.2/self_attn/Gather_6"Gather* axis t (/blocks.2/self_attn/Transpose_1_output_0$/blocks.2/self_attn/Shape_5_output_0/blocks.2/self_attn/Shape_5"Shape (/blocks.2/self_attn/Constant_31_output_0/blocks.2/self_attn/Constant_31"Constant*E value*9B+/blocks.2/self_attn/Constant_31_attr::valueJ  $/blocks.2/self_attn/Shape_5_output_0 (/blocks.2/self_attn/Constant_31_output_0%/blocks.2/self_attn/Gather_7_output_0/blocks.2/self_attn/Gather_7"Gather* axis t (/blocks.2/self_attn/Transpose_1_output_0$/blocks.2/self_attn/Shape_6_output_0/blocks.2/self_attn/Shape_6"Shape (/blocks.2/self_attn/Constant_32_output_0/blocks.2/self_attn/Constant_32"Constant*E value*9B+/blocks.2/self_attn/Constant_32_attr::valueJ  $/blocks.2/self_attn/Shape_6_output_0 (/blocks.2/self_attn/Constant_32_output_0%/blocks.2/self_attn/Gather_8_output_0/blocks.2/self_attn/Gather_8"Gather* axis t (/blocks.2/self_attn/Transpose_1_output_0$/blocks.2/self_attn/Shape_7_output_0/blocks.2/self_attn/Shape_7"Shape (/blocks.2/self_attn/Constant_33_output_0/blocks.2/self_attn/Constant_33"Constant*E value*9B+/blocks.2/self_attn/Constant_33_attr::valueJ  $/blocks.2/self_attn/Shape_7_output_0 (/blocks.2/self_attn/Constant_33_output_0%/blocks.2/self_attn/Gather_9_output_0/blocks.2/self_attn/Gather_9"Gather* axis (/blocks.2/self_attn/Constant_34_output_0/blocks.2/self_attn/Constant_34"Constant*G value*;B+/blocks.2/self_attn/Constant_34_attr::valueJ  (/blocks.2/self_attn/Transpose_1_output_0 (/blocks.2/self_attn/Constant_34_output_0)/blocks.2/self_attn/Unsqueeze_12_output_0 /blocks.2/self_attn/Unsqueeze_12" Unsqueeze (/blocks.2/self_attn/Constant_35_output_0/blocks.2/self_attn/Constant_35"Constant*G value*;B+/blocks.2/self_attn/Constant_35_attr::valueJ  %/blocks.2/self_attn/Gather_6_output_0 (/blocks.2/self_attn/Constant_35_output_0)/blocks.2/self_attn/Unsqueeze_13_output_0 /blocks.2/self_attn/Unsqueeze_13" Unsqueeze (/blocks.2/self_attn/Constant_36_output_0/blocks.2/self_attn/Constant_36"Constant*G value*;B+/blocks.2/self_attn/Constant_36_attr::valueJ  %/blocks.2/self_attn/Gather_7_output_0 (/blocks.2/self_attn/Constant_36_output_0)/blocks.2/self_attn/Unsqueeze_14_output_0 /blocks.2/self_attn/Unsqueeze_14" Unsqueeze (/blocks.2/self_attn/Constant_37_output_0/blocks.2/self_attn/Constant_37"Constant*G value*;B+/blocks.2/self_attn/Constant_37_attr::valueJ (/blocks.2/self_attn/Constant_38_output_0/blocks.2/self_attn/Constant_38"Constant*G value*;B+/blocks.2/self_attn/Constant_38_attr::valueJ  %/blocks.2/self_attn/Gather_8_output_0 (/blocks.2/self_attn/Constant_38_output_0)/blocks.2/self_attn/Unsqueeze_15_output_0 /blocks.2/self_attn/Unsqueeze_15" Unsqueeze (/blocks.2/self_attn/Constant_39_output_0/blocks.2/self_attn/Constant_39"Constant*G value*;B+/blocks.2/self_attn/Constant_39_attr::valueJ  %/blocks.2/self_attn/Gather_9_output_0 (/blocks.2/self_attn/Constant_39_output_0)/blocks.2/self_attn/Unsqueeze_16_output_0 /blocks.2/self_attn/Unsqueeze_16" Unsqueeze  )/blocks.2/self_attn/Unsqueeze_13_output_0 )/blocks.2/self_attn/Unsqueeze_14_output_0 (/blocks.2/self_attn/Constant_37_output_0 )/blocks.2/self_attn/Unsqueeze_15_output_0 )/blocks.2/self_attn/Unsqueeze_16_output_0%/blocks.2/self_attn/Concat_8_output_0/blocks.2/self_attn/Concat_8"Concat* axis (/blocks.2/self_attn/Constant_40_output_0/blocks.2/self_attn/Constant_40"Constant*G value*;B+/blocks.2/self_attn/Constant_40_attr::valueJ  %/blocks.2/self_attn/Concat_8_output_0 (/blocks.2/self_attn/Constant_40_output_0&/blocks.2/self_attn/Reshape_3_output_0/blocks.2/self_attn/Reshape_3"Reshape* allowzero r &/blocks.2/self_attn/Reshape_3_output_0$/blocks.2/self_attn/Shape_8_output_0/blocks.2/self_attn/Shape_8"Shape  $/blocks.2/self_attn/Shape_8_output_0,/blocks.2/self_attn/ConstantOfShape_output_0#/blocks.2/self_attn/ConstantOfShape"ConstantOfShape*K value*?B//blocks.2/self_attn/ConstantOfShape_attr::valueJ (/blocks.2/self_attn/Constant_41_output_0/blocks.2/self_attn/Constant_41"Constant*E value*9B+/blocks.2/self_attn/Constant_41_attr::valueJ  ,/blocks.2/self_attn/ConstantOfShape_output_0 (/blocks.2/self_attn/Constant_41_output_0"/blocks.2/self_attn/Mul_4_output_0/blocks.2/self_attn/Mul_4"Mul  &/blocks.2/self_attn/Reshape_3_output_0 "/blocks.2/self_attn/Mul_4_output_0"/blocks.2/self_attn/Equal_output_0/blocks.2/self_attn/Equal"Equal  "/blocks.2/self_attn/Equal_output_0 ,/blocks.2/self_attn/ConstantOfShape_output_0 &/blocks.2/self_attn/Reshape_3_output_0"/blocks.2/self_attn/Where_output_0/blocks.2/self_attn/Where"Where  )/blocks.2/self_attn/Unsqueeze_12_output_0 "/blocks.2/self_attn/Where_output_0#/blocks.2/self_attn/Expand_output_0/blocks.2/self_attn/Expand"Expand (/blocks.2/self_attn/Constant_42_output_0/blocks.2/self_attn/Constant_42"Constant*E value*9B+/blocks.2/self_attn/Constant_42_attr::valueJ  %/blocks.2/self_attn/Gather_7_output_0 (/blocks.2/self_attn/Constant_42_output_0"/blocks.2/self_attn/Mul_5_output_0/blocks.2/self_attn/Mul_5"Mul fonnx::Unsqueeze_1118 Constant_3225"Constant*5 value*)BConstant_3225_attr::valueJ  %/blocks.2/self_attn/Gather_6_output_0 onnx::Unsqueeze_1118)/blocks.2/self_attn/Unsqueeze_17_output_0 /blocks.2/self_attn/Unsqueeze_17" Unsqueeze fonnx::Unsqueeze_1120 Constant_3227"Constant*5 value*)BConstant_3227_attr::valueJ  "/blocks.2/self_attn/Mul_5_output_0 onnx::Unsqueeze_1120)/blocks.2/self_attn/Unsqueeze_18_output_0 /blocks.2/self_attn/Unsqueeze_18" Unsqueeze fonnx::Unsqueeze_1122 Constant_3229"Constant*5 value*)BConstant_3229_attr::valueJ  %/blocks.2/self_attn/Gather_8_output_0 onnx::Unsqueeze_1122)/blocks.2/self_attn/Unsqueeze_19_output_0 /blocks.2/self_attn/Unsqueeze_19" Unsqueeze fonnx::Unsqueeze_1124 Constant_3231"Constant*5 value*)BConstant_3231_attr::valueJ  %/blocks.2/self_attn/Gather_9_output_0 onnx::Unsqueeze_1124)/blocks.2/self_attn/Unsqueeze_20_output_0 /blocks.2/self_attn/Unsqueeze_20" Unsqueeze  )/blocks.2/self_attn/Unsqueeze_17_output_0 )/blocks.2/self_attn/Unsqueeze_18_output_0 )/blocks.2/self_attn/Unsqueeze_19_output_0 )/blocks.2/self_attn/Unsqueeze_20_output_0%/blocks.2/self_attn/Concat_9_output_0/blocks.2/self_attn/Concat_9"Concat* axis  #/blocks.2/self_attn/Expand_output_0 %/blocks.2/self_attn/Concat_9_output_0&/blocks.2/self_attn/Reshape_4_output_0/blocks.2/self_attn/Reshape_4"Reshape* allowzero t (/blocks.2/self_attn/Transpose_2_output_0$/blocks.2/self_attn/Shape_9_output_0/blocks.2/self_attn/Shape_9"Shape (/blocks.2/self_attn/Constant_43_output_0/blocks.2/self_attn/Constant_43"Constant*E value*9B+/blocks.2/self_attn/Constant_43_attr::valueJ  $/blocks.2/self_attn/Shape_9_output_0 (/blocks.2/self_attn/Constant_43_output_0&/blocks.2/self_attn/Gather_10_output_0/blocks.2/self_attn/Gather_10"Gather* axis v (/blocks.2/self_attn/Transpose_2_output_0%/blocks.2/self_attn/Shape_10_output_0/blocks.2/self_attn/Shape_10"Shape (/blocks.2/self_attn/Constant_44_output_0/blocks.2/self_attn/Constant_44"Constant*E value*9B+/blocks.2/self_attn/Constant_44_attr::valueJ  %/blocks.2/self_attn/Shape_10_output_0 (/blocks.2/self_attn/Constant_44_output_0&/blocks.2/self_attn/Gather_11_output_0/blocks.2/self_attn/Gather_11"Gather* axis v (/blocks.2/self_attn/Transpose_2_output_0%/blocks.2/self_attn/Shape_11_output_0/blocks.2/self_attn/Shape_11"Shape (/blocks.2/self_attn/Constant_45_output_0/blocks.2/self_attn/Constant_45"Constant*E value*9B+/blocks.2/self_attn/Constant_45_attr::valueJ  %/blocks.2/self_attn/Shape_11_output_0 (/blocks.2/self_attn/Constant_45_output_0&/blocks.2/self_attn/Gather_12_output_0/blocks.2/self_attn/Gather_12"Gather* axis v (/blocks.2/self_attn/Transpose_2_output_0%/blocks.2/self_attn/Shape_12_output_0/blocks.2/self_attn/Shape_12"Shape (/blocks.2/self_attn/Constant_46_output_0/blocks.2/self_attn/Constant_46"Constant*E value*9B+/blocks.2/self_attn/Constant_46_attr::valueJ  %/blocks.2/self_attn/Shape_12_output_0 (/blocks.2/self_attn/Constant_46_output_0&/blocks.2/self_attn/Gather_13_output_0/blocks.2/self_attn/Gather_13"Gather* axis (/blocks.2/self_attn/Constant_47_output_0/blocks.2/self_attn/Constant_47"Constant*G value*;B+/blocks.2/self_attn/Constant_47_attr::valueJ  (/blocks.2/self_attn/Transpose_2_output_0 (/blocks.2/self_attn/Constant_47_output_0)/blocks.2/self_attn/Unsqueeze_21_output_0 /blocks.2/self_attn/Unsqueeze_21" Unsqueeze (/blocks.2/self_attn/Constant_48_output_0/blocks.2/self_attn/Constant_48"Constant*G value*;B+/blocks.2/self_attn/Constant_48_attr::valueJ  &/blocks.2/self_attn/Gather_10_output_0 (/blocks.2/self_attn/Constant_48_output_0)/blocks.2/self_attn/Unsqueeze_22_output_0 /blocks.2/self_attn/Unsqueeze_22" Unsqueeze (/blocks.2/self_attn/Constant_49_output_0/blocks.2/self_attn/Constant_49"Constant*G value*;B+/blocks.2/self_attn/Constant_49_attr::valueJ  &/blocks.2/self_attn/Gather_11_output_0 (/blocks.2/self_attn/Constant_49_output_0)/blocks.2/self_attn/Unsqueeze_23_output_0 /blocks.2/self_attn/Unsqueeze_23" Unsqueeze (/blocks.2/self_attn/Constant_50_output_0/blocks.2/self_attn/Constant_50"Constant*G value*;B+/blocks.2/self_attn/Constant_50_attr::valueJ (/blocks.2/self_attn/Constant_51_output_0/blocks.2/self_attn/Constant_51"Constant*G value*;B+/blocks.2/self_attn/Constant_51_attr::valueJ  &/blocks.2/self_attn/Gather_12_output_0 (/blocks.2/self_attn/Constant_51_output_0)/blocks.2/self_attn/Unsqueeze_24_output_0 /blocks.2/self_attn/Unsqueeze_24" Unsqueeze (/blocks.2/self_attn/Constant_52_output_0/blocks.2/self_attn/Constant_52"Constant*G value*;B+/blocks.2/self_attn/Constant_52_attr::valueJ  &/blocks.2/self_attn/Gather_13_output_0 (/blocks.2/self_attn/Constant_52_output_0)/blocks.2/self_attn/Unsqueeze_25_output_0 /blocks.2/self_attn/Unsqueeze_25" Unsqueeze  )/blocks.2/self_attn/Unsqueeze_22_output_0 )/blocks.2/self_attn/Unsqueeze_23_output_0 (/blocks.2/self_attn/Constant_50_output_0 )/blocks.2/self_attn/Unsqueeze_24_output_0 )/blocks.2/self_attn/Unsqueeze_25_output_0&/blocks.2/self_attn/Concat_10_output_0/blocks.2/self_attn/Concat_10"Concat* axis (/blocks.2/self_attn/Constant_53_output_0/blocks.2/self_attn/Constant_53"Constant*G value*;B+/blocks.2/self_attn/Constant_53_attr::valueJ  &/blocks.2/self_attn/Concat_10_output_0 (/blocks.2/self_attn/Constant_53_output_0&/blocks.2/self_attn/Reshape_5_output_0/blocks.2/self_attn/Reshape_5"Reshape* allowzero t &/blocks.2/self_attn/Reshape_5_output_0%/blocks.2/self_attn/Shape_13_output_0/blocks.2/self_attn/Shape_13"Shape  %/blocks.2/self_attn/Shape_13_output_0./blocks.2/self_attn/ConstantOfShape_1_output_0%/blocks.2/self_attn/ConstantOfShape_1"ConstantOfShape*M value*AB1/blocks.2/self_attn/ConstantOfShape_1_attr::valueJ (/blocks.2/self_attn/Constant_54_output_0/blocks.2/self_attn/Constant_54"Constant*E value*9B+/blocks.2/self_attn/Constant_54_attr::valueJ  ./blocks.2/self_attn/ConstantOfShape_1_output_0 (/blocks.2/self_attn/Constant_54_output_0"/blocks.2/self_attn/Mul_6_output_0/blocks.2/self_attn/Mul_6"Mul  &/blocks.2/self_attn/Reshape_5_output_0 "/blocks.2/self_attn/Mul_6_output_0$/blocks.2/self_attn/Equal_1_output_0/blocks.2/self_attn/Equal_1"Equal  $/blocks.2/self_attn/Equal_1_output_0 ./blocks.2/self_attn/ConstantOfShape_1_output_0 &/blocks.2/self_attn/Reshape_5_output_0$/blocks.2/self_attn/Where_1_output_0/blocks.2/self_attn/Where_1"Where  )/blocks.2/self_attn/Unsqueeze_21_output_0 $/blocks.2/self_attn/Where_1_output_0%/blocks.2/self_attn/Expand_1_output_0/blocks.2/self_attn/Expand_1"Expand (/blocks.2/self_attn/Constant_55_output_0/blocks.2/self_attn/Constant_55"Constant*E value*9B+/blocks.2/self_attn/Constant_55_attr::valueJ  &/blocks.2/self_attn/Gather_11_output_0 (/blocks.2/self_attn/Constant_55_output_0"/blocks.2/self_attn/Mul_7_output_0/blocks.2/self_attn/Mul_7"Mul fonnx::Unsqueeze_1164 Constant_3270"Constant*5 value*)BConstant_3270_attr::valueJ  &/blocks.2/self_attn/Gather_10_output_0 onnx::Unsqueeze_1164)/blocks.2/self_attn/Unsqueeze_26_output_0 /blocks.2/self_attn/Unsqueeze_26" Unsqueeze fonnx::Unsqueeze_1166 Constant_3272"Constant*5 value*)BConstant_3272_attr::valueJ  "/blocks.2/self_attn/Mul_7_output_0 onnx::Unsqueeze_1166)/blocks.2/self_attn/Unsqueeze_27_output_0 /blocks.2/self_attn/Unsqueeze_27" Unsqueeze fonnx::Unsqueeze_1168 Constant_3274"Constant*5 value*)BConstant_3274_attr::valueJ  &/blocks.2/self_attn/Gather_12_output_0 onnx::Unsqueeze_1168)/blocks.2/self_attn/Unsqueeze_28_output_0 /blocks.2/self_attn/Unsqueeze_28" Unsqueeze fonnx::Unsqueeze_1170 Constant_3276"Constant*5 value*)BConstant_3276_attr::valueJ  &/blocks.2/self_attn/Gather_13_output_0 onnx::Unsqueeze_1170)/blocks.2/self_attn/Unsqueeze_29_output_0 /blocks.2/self_attn/Unsqueeze_29" Unsqueeze  )/blocks.2/self_attn/Unsqueeze_26_output_0 )/blocks.2/self_attn/Unsqueeze_27_output_0 )/blocks.2/self_attn/Unsqueeze_28_output_0 )/blocks.2/self_attn/Unsqueeze_29_output_0&/blocks.2/self_attn/Concat_11_output_0/blocks.2/self_attn/Concat_11"Concat* axis  %/blocks.2/self_attn/Expand_1_output_0 &/blocks.2/self_attn/Concat_11_output_0&/blocks.2/self_attn/Reshape_6_output_0/blocks.2/self_attn/Reshape_6"Reshape* allowzero  &/blocks.2/self_attn/Transpose_output_0 &/blocks.2/self_attn/Reshape_4_output_0#/blocks.2/self_attn/MatMul_output_0/blocks.2/self_attn/MatMul"MatMul (/blocks.2/self_attn/Constant_56_output_0/blocks.2/self_attn/Constant_56"Constant*A value*5B+/blocks.2/self_attn/Constant_56_attr::valueJ5A  #/blocks.2/self_attn/MatMul_output_0 (/blocks.2/self_attn/Constant_56_output_0"/blocks.2/self_attn/Div_2_output_0/blocks.2/self_attn/Div_2"Div x "/blocks.2/self_attn/Div_2_output_0 attention_mask"/blocks.2/self_attn/Add_2_output_0/blocks.2/self_attn/Add_2"Add  "/blocks.2/self_attn/Add_2_output_0$/blocks.2/self_attn/Softmax_output_0/blocks.2/self_attn/Softmax"Softmax* axis x $/blocks.2/self_attn/Softmax_output_0#/blocks.2/self_attn/Cast_4_output_0/blocks.2/self_attn/Cast_4"Cast* to  #/blocks.2/self_attn/Cast_4_output_0 &/blocks.2/self_attn/Reshape_6_output_0%/blocks.2/self_attn/MatMul_1_output_0/blocks.2/self_attn/MatMul_1"MatMul  %/blocks.2/self_attn/MatMul_1_output_0(/blocks.2/self_attn/Transpose_3_output_0/blocks.2/self_attn/Transpose_3" Transpose* perm@@@@ fonnx::Unsqueeze_1182 Constant_3288"Constant*5 value*)BConstant_3288_attr::valueJ  #/blocks.2/self_attn/Gather_output_0 onnx::Unsqueeze_1182)/blocks.2/self_attn/Unsqueeze_30_output_0 /blocks.2/self_attn/Unsqueeze_30" Unsqueeze fonnx::Unsqueeze_1184 Constant_3290"Constant*5 value*)BConstant_3290_attr::valueJ  %/blocks.2/self_attn/Gather_1_output_0 onnx::Unsqueeze_1184)/blocks.2/self_attn/Unsqueeze_31_output_0 /blocks.2/self_attn/Unsqueeze_31" Unsqueeze (/blocks.2/self_attn/Constant_57_output_0/blocks.2/self_attn/Constant_57"Constant*G value*;B+/blocks.2/self_attn/Constant_57_attr::valueJ  )/blocks.2/self_attn/Unsqueeze_30_output_0 )/blocks.2/self_attn/Unsqueeze_31_output_0 (/blocks.2/self_attn/Constant_57_output_0&/blocks.2/self_attn/Concat_12_output_0/blocks.2/self_attn/Concat_12"Concat* axis  (/blocks.2/self_attn/Transpose_3_output_0 &/blocks.2/self_attn/Concat_12_output_0&/blocks.2/self_attn/Reshape_7_output_0/blocks.2/self_attn/Reshape_7"Reshape* allowzero  &/blocks.2/self_attn/Reshape_7_output_0 onnx::MatMul_8645*/blocks.2/self_attn/o_proj/MatMul_output_0!/blocks.2/self_attn/o_proj/MatMul"MatMul  )/blocks.2/input_layernorm/Cast_1_output_0 */blocks.2/self_attn/o_proj/MatMul_output_0/blocks.2/Add_output_0 /blocks.2/Add"Add  /blocks.2/Add_output_00/blocks.2/post_attention_layernorm/Cast_output_0'/blocks.2/post_attention_layernorm/Cast"Cast* to 4/blocks.2/post_attention_layernorm/Constant_output_0+/blocks.2/post_attention_layernorm/Constant"Constant*M value*AB7/blocks.2/post_attention_layernorm/Constant_attr::valueJ@  0/blocks.2/post_attention_layernorm/Cast_output_0 4/blocks.2/post_attention_layernorm/Constant_output_0//blocks.2/post_attention_layernorm/Pow_output_0&/blocks.2/post_attention_layernorm/Pow"Pow  //blocks.2/post_attention_layernorm/Pow_output_06/blocks.2/post_attention_layernorm/ReduceMean_output_0-/blocks.2/post_attention_layernorm/ReduceMean" ReduceMean* axes@* keepdims 6/blocks.2/post_attention_layernorm/Constant_1_output_0-/blocks.2/post_attention_layernorm/Constant_1"Constant*O value*CB9/blocks.2/post_attention_layernorm/Constant_1_attr::valueJ75  6/blocks.2/post_attention_layernorm/ReduceMean_output_0 6/blocks.2/post_attention_layernorm/Constant_1_output_0//blocks.2/post_attention_layernorm/Add_output_0&/blocks.2/post_attention_layernorm/Add"Add  //blocks.2/post_attention_layernorm/Add_output_00/blocks.2/post_attention_layernorm/Sqrt_output_0'/blocks.2/post_attention_layernorm/Sqrt"Sqrt 6/blocks.2/post_attention_layernorm/Constant_2_output_0-/blocks.2/post_attention_layernorm/Constant_2"Constant*O value*CB9/blocks.2/post_attention_layernorm/Constant_2_attr::valueJ?  6/blocks.2/post_attention_layernorm/Constant_2_output_0 0/blocks.2/post_attention_layernorm/Sqrt_output_0//blocks.2/post_attention_layernorm/Div_output_0&/blocks.2/post_attention_layernorm/Div"Div  0/blocks.2/post_attention_layernorm/Cast_output_02/blocks.2/post_attention_layernorm/Cast_1_output_0)/blocks.2/post_attention_layernorm/Cast_1"Cast* to  2/blocks.2/post_attention_layernorm/Cast_1_output_0 //blocks.2/post_attention_layernorm/Div_output_0//blocks.2/post_attention_layernorm/Mul_output_0&/blocks.2/post_attention_layernorm/Mul"Mul  //blocks.2/post_attention_layernorm/Mul_output_0 (blocks.2.post_attention_layernorm.weight1/blocks.2/post_attention_layernorm/Mul_1_output_0(/blocks.2/post_attention_layernorm/Mul_1"Mul  1/blocks.2/post_attention_layernorm/Mul_1_output_02/blocks.2/post_attention_layernorm/Cast_2_output_0)/blocks.2/post_attention_layernorm/Cast_2"Cast* to  2/blocks.2/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_8646'/blocks.2/mlp/gate_proj/MatMul_output_0/blocks.2/mlp/gate_proj/MatMul"MatMul w '/blocks.2/mlp/gate_proj/MatMul_output_0%/blocks.2/mlp/act_fn/Sigmoid_output_0/blocks.2/mlp/act_fn/Sigmoid"Sigmoid  '/blocks.2/mlp/gate_proj/MatMul_output_0 %/blocks.2/mlp/act_fn/Sigmoid_output_0!/blocks.2/mlp/act_fn/Mul_output_0/blocks.2/mlp/act_fn/Mul"Mul  2/blocks.2/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_8647%/blocks.2/mlp/up_proj/MatMul_output_0/blocks.2/mlp/up_proj/MatMul"MatMul ~ !/blocks.2/mlp/act_fn/Mul_output_0 %/blocks.2/mlp/up_proj/MatMul_output_0/blocks.2/mlp/Mul_output_0/blocks.2/mlp/Mul"Mul  /blocks.2/mlp/Mul_output_0 onnx::MatMul_8648'/blocks.2/mlp/down_proj/MatMul_output_0/blocks.2/mlp/down_proj/MatMul"MatMul  2/blocks.2/post_attention_layernorm/Cast_1_output_0 '/blocks.2/mlp/down_proj/MatMul_output_0/blocks.2/Add_1_output_0/blocks.2/Add_1"Add o past_key_values (/blocks.0/self_attn/Constant_10_output_0/Gather_3_output_0 /Gather_3"Gather* axis /blocks.3/Constant_output_0/blocks.3/Constant"Constant*J value*>B/blocks.3/Constant_attr::valueJ  /blocks.2/Add_1_output_0 /blocks.3/Constant_output_0/blocks.3/Reshape_output_0/blocks.3/Reshape"Reshape* allowzero v /blocks.3/Reshape_output_0'/blocks.3/input_layernorm/Cast_output_0/blocks.3/input_layernorm/Cast"Cast* to +/blocks.3/input_layernorm/Constant_output_0"/blocks.3/input_layernorm/Constant"Constant*D value*8B./blocks.3/input_layernorm/Constant_attr::valueJ@  '/blocks.3/input_layernorm/Cast_output_0 +/blocks.3/input_layernorm/Constant_output_0&/blocks.3/input_layernorm/Pow_output_0/blocks.3/input_layernorm/Pow"Pow  &/blocks.3/input_layernorm/Pow_output_0-/blocks.3/input_layernorm/ReduceMean_output_0$/blocks.3/input_layernorm/ReduceMean" ReduceMean* axes@* keepdims -/blocks.3/input_layernorm/Constant_1_output_0$/blocks.3/input_layernorm/Constant_1"Constant*F value*:B0/blocks.3/input_layernorm/Constant_1_attr::valueJ75  -/blocks.3/input_layernorm/ReduceMean_output_0 -/blocks.3/input_layernorm/Constant_1_output_0&/blocks.3/input_layernorm/Add_output_0/blocks.3/input_layernorm/Add"Add w &/blocks.3/input_layernorm/Add_output_0'/blocks.3/input_layernorm/Sqrt_output_0/blocks.3/input_layernorm/Sqrt"Sqrt -/blocks.3/input_layernorm/Constant_2_output_0$/blocks.3/input_layernorm/Constant_2"Constant*F value*:B0/blocks.3/input_layernorm/Constant_2_attr::valueJ?  -/blocks.3/input_layernorm/Constant_2_output_0 '/blocks.3/input_layernorm/Sqrt_output_0&/blocks.3/input_layernorm/Div_output_0/blocks.3/input_layernorm/Div"Div  '/blocks.3/input_layernorm/Cast_output_0)/blocks.3/input_layernorm/Cast_1_output_0 /blocks.3/input_layernorm/Cast_1"Cast* to  )/blocks.3/input_layernorm/Cast_1_output_0 &/blocks.3/input_layernorm/Div_output_0&/blocks.3/input_layernorm/Mul_output_0/blocks.3/input_layernorm/Mul"Mul  &/blocks.3/input_layernorm/Mul_output_0 blocks.3.input_layernorm.weight(/blocks.3/input_layernorm/Mul_1_output_0/blocks.3/input_layernorm/Mul_1"Mul  (/blocks.3/input_layernorm/Mul_1_output_0)/blocks.3/input_layernorm/Cast_2_output_0 /blocks.3/input_layernorm/Cast_2"Cast* to q )/blocks.3/input_layernorm/Cast_2_output_0"/blocks.3/self_attn/Shape_output_0/blocks.3/self_attn/Shape"Shape %/blocks.3/self_attn/Constant_output_0/blocks.3/self_attn/Constant"Constant*B value*6B(/blocks.3/self_attn/Constant_attr::valueJ  "/blocks.3/self_attn/Shape_output_0 %/blocks.3/self_attn/Constant_output_0#/blocks.3/self_attn/Gather_output_0/blocks.3/self_attn/Gather"Gather* axis u )/blocks.3/input_layernorm/Cast_2_output_0$/blocks.3/self_attn/Shape_1_output_0/blocks.3/self_attn/Shape_1"Shape '/blocks.3/self_attn/Constant_1_output_0/blocks.3/self_attn/Constant_1"Constant*D value*8B*/blocks.3/self_attn/Constant_1_attr::valueJ  $/blocks.3/self_attn/Shape_1_output_0 '/blocks.3/self_attn/Constant_1_output_0%/blocks.3/self_attn/Gather_1_output_0/blocks.3/self_attn/Gather_1"Gather* axis  )/blocks.3/input_layernorm/Cast_2_output_0 onnx::MatMul_8649*/blocks.3/self_attn/q_proj/MatMul_output_0!/blocks.3/self_attn/q_proj/MatMul"MatMul  )/blocks.3/input_layernorm/Cast_2_output_0 onnx::MatMul_8650*/blocks.3/self_attn/k_proj/MatMul_output_0!/blocks.3/self_attn/k_proj/MatMul"MatMul  )/blocks.3/input_layernorm/Cast_2_output_0 onnx::MatMul_8651*/blocks.3/self_attn/v_proj/MatMul_output_0!/blocks.3/self_attn/v_proj/MatMul"MatMul fonnx::Unsqueeze_1244 Constant_3342"Constant*5 value*)BConstant_3342_attr::valueJ  #/blocks.3/self_attn/Gather_output_0 onnx::Unsqueeze_1244&/blocks.3/self_attn/Unsqueeze_output_0/blocks.3/self_attn/Unsqueeze" Unsqueeze fonnx::Unsqueeze_1246 Constant_3344"Constant*5 value*)BConstant_3344_attr::valueJ  %/blocks.3/self_attn/Gather_1_output_0 onnx::Unsqueeze_1246(/blocks.3/self_attn/Unsqueeze_1_output_0/blocks.3/self_attn/Unsqueeze_1" Unsqueeze '/blocks.3/self_attn/Constant_2_output_0/blocks.3/self_attn/Constant_2"Constant*F value*:B*/blocks.3/self_attn/Constant_2_attr::valueJ '/blocks.3/self_attn/Constant_3_output_0/blocks.3/self_attn/Constant_3"Constant*F value*:B*/blocks.3/self_attn/Constant_3_attr::valueJ  &/blocks.3/self_attn/Unsqueeze_output_0 (/blocks.3/self_attn/Unsqueeze_1_output_0 '/blocks.3/self_attn/Constant_2_output_0 '/blocks.3/self_attn/Constant_3_output_0#/blocks.3/self_attn/Concat_output_0/blocks.3/self_attn/Concat"Concat* axis  */blocks.3/self_attn/q_proj/MatMul_output_0 #/blocks.3/self_attn/Concat_output_0$/blocks.3/self_attn/Reshape_output_0/blocks.3/self_attn/Reshape"Reshape* allowzero fonnx::Unsqueeze_1254 Constant_3350"Constant*5 value*)BConstant_3350_attr::valueJ  #/blocks.3/self_attn/Gather_output_0 onnx::Unsqueeze_1254(/blocks.3/self_attn/Unsqueeze_2_output_0/blocks.3/self_attn/Unsqueeze_2" Unsqueeze fonnx::Unsqueeze_1256 Constant_3352"Constant*5 value*)BConstant_3352_attr::valueJ  %/blocks.3/self_attn/Gather_1_output_0 onnx::Unsqueeze_1256(/blocks.3/self_attn/Unsqueeze_3_output_0/blocks.3/self_attn/Unsqueeze_3" Unsqueeze '/blocks.3/self_attn/Constant_4_output_0/blocks.3/self_attn/Constant_4"Constant*F value*:B*/blocks.3/self_attn/Constant_4_attr::valueJ '/blocks.3/self_attn/Constant_5_output_0/blocks.3/self_attn/Constant_5"Constant*F value*:B*/blocks.3/self_attn/Constant_5_attr::valueJ  (/blocks.3/self_attn/Unsqueeze_2_output_0 (/blocks.3/self_attn/Unsqueeze_3_output_0 '/blocks.3/self_attn/Constant_4_output_0 '/blocks.3/self_attn/Constant_5_output_0%/blocks.3/self_attn/Concat_1_output_0/blocks.3/self_attn/Concat_1"Concat* axis fonnx::Unsqueeze_1263 Constant_3357"Constant*5 value*)BConstant_3357_attr::valueJ  #/blocks.3/self_attn/Gather_output_0 onnx::Unsqueeze_1263(/blocks.3/self_attn/Unsqueeze_4_output_0/blocks.3/self_attn/Unsqueeze_4" Unsqueeze fonnx::Unsqueeze_1265 Constant_3359"Constant*5 value*)BConstant_3359_attr::valueJ  %/blocks.3/self_attn/Gather_1_output_0 onnx::Unsqueeze_1265(/blocks.3/self_attn/Unsqueeze_5_output_0/blocks.3/self_attn/Unsqueeze_5" Unsqueeze '/blocks.3/self_attn/Constant_6_output_0/blocks.3/self_attn/Constant_6"Constant*F value*:B*/blocks.3/self_attn/Constant_6_attr::valueJ '/blocks.3/self_attn/Constant_7_output_0/blocks.3/self_attn/Constant_7"Constant*F value*:B*/blocks.3/self_attn/Constant_7_attr::valueJ  (/blocks.3/self_attn/Unsqueeze_4_output_0 (/blocks.3/self_attn/Unsqueeze_5_output_0 '/blocks.3/self_attn/Constant_6_output_0 '/blocks.3/self_attn/Constant_7_output_0%/blocks.3/self_attn/Concat_2_output_0/blocks.3/self_attn/Concat_2"Concat* axis  */blocks.3/self_attn/k_proj/MatMul_output_0 %/blocks.3/self_attn/Concat_1_output_0&/blocks.3/self_attn/Reshape_1_output_0/blocks.3/self_attn/Reshape_1"Reshape* allowzero  */blocks.3/self_attn/v_proj/MatMul_output_0 %/blocks.3/self_attn/Concat_2_output_0&/blocks.3/self_attn/Reshape_2_output_0/blocks.3/self_attn/Reshape_2"Reshape* allowzero  $/blocks.3/self_attn/Reshape_output_0(/blocks.3/self_attn/q_norm/Cast_output_0/blocks.3/self_attn/q_norm/Cast"Cast* to ,/blocks.3/self_attn/q_norm/Constant_output_0#/blocks.3/self_attn/q_norm/Constant"Constant*E value*9B//blocks.3/self_attn/q_norm/Constant_attr::valueJ@  (/blocks.3/self_attn/q_norm/Cast_output_0 ,/blocks.3/self_attn/q_norm/Constant_output_0'/blocks.3/self_attn/q_norm/Pow_output_0/blocks.3/self_attn/q_norm/Pow"Pow  '/blocks.3/self_attn/q_norm/Pow_output_0./blocks.3/self_attn/q_norm/ReduceMean_output_0%/blocks.3/self_attn/q_norm/ReduceMean" ReduceMean* axes@* keepdims ./blocks.3/self_attn/q_norm/Constant_1_output_0%/blocks.3/self_attn/q_norm/Constant_1"Constant*G value*;B1/blocks.3/self_attn/q_norm/Constant_1_attr::valueJ75  ./blocks.3/self_attn/q_norm/ReduceMean_output_0 ./blocks.3/self_attn/q_norm/Constant_1_output_0'/blocks.3/self_attn/q_norm/Add_output_0/blocks.3/self_attn/q_norm/Add"Add z '/blocks.3/self_attn/q_norm/Add_output_0(/blocks.3/self_attn/q_norm/Sqrt_output_0/blocks.3/self_attn/q_norm/Sqrt"Sqrt ./blocks.3/self_attn/q_norm/Constant_2_output_0%/blocks.3/self_attn/q_norm/Constant_2"Constant*G value*;B1/blocks.3/self_attn/q_norm/Constant_2_attr::valueJ?  ./blocks.3/self_attn/q_norm/Constant_2_output_0 (/blocks.3/self_attn/q_norm/Sqrt_output_0'/blocks.3/self_attn/q_norm/Div_output_0/blocks.3/self_attn/q_norm/Div"Div  (/blocks.3/self_attn/q_norm/Cast_output_0*/blocks.3/self_attn/q_norm/Cast_1_output_0!/blocks.3/self_attn/q_norm/Cast_1"Cast* to  */blocks.3/self_attn/q_norm/Cast_1_output_0 '/blocks.3/self_attn/q_norm/Div_output_0'/blocks.3/self_attn/q_norm/Mul_output_0/blocks.3/self_attn/q_norm/Mul"Mul  '/blocks.3/self_attn/q_norm/Mul_output_0 blocks.3.self_attn.q_norm.weight)/blocks.3/self_attn/q_norm/Mul_1_output_0 /blocks.3/self_attn/q_norm/Mul_1"Mul  )/blocks.3/self_attn/q_norm/Mul_1_output_0*/blocks.3/self_attn/q_norm/Cast_2_output_0!/blocks.3/self_attn/q_norm/Cast_2"Cast* to  &/blocks.3/self_attn/Reshape_1_output_0(/blocks.3/self_attn/k_norm/Cast_output_0/blocks.3/self_attn/k_norm/Cast"Cast* to ,/blocks.3/self_attn/k_norm/Constant_output_0#/blocks.3/self_attn/k_norm/Constant"Constant*E value*9B//blocks.3/self_attn/k_norm/Constant_attr::valueJ@  (/blocks.3/self_attn/k_norm/Cast_output_0 ,/blocks.3/self_attn/k_norm/Constant_output_0'/blocks.3/self_attn/k_norm/Pow_output_0/blocks.3/self_attn/k_norm/Pow"Pow  '/blocks.3/self_attn/k_norm/Pow_output_0./blocks.3/self_attn/k_norm/ReduceMean_output_0%/blocks.3/self_attn/k_norm/ReduceMean" ReduceMean* axes@* keepdims ./blocks.3/self_attn/k_norm/Constant_1_output_0%/blocks.3/self_attn/k_norm/Constant_1"Constant*G value*;B1/blocks.3/self_attn/k_norm/Constant_1_attr::valueJ75  ./blocks.3/self_attn/k_norm/ReduceMean_output_0 ./blocks.3/self_attn/k_norm/Constant_1_output_0'/blocks.3/self_attn/k_norm/Add_output_0/blocks.3/self_attn/k_norm/Add"Add z '/blocks.3/self_attn/k_norm/Add_output_0(/blocks.3/self_attn/k_norm/Sqrt_output_0/blocks.3/self_attn/k_norm/Sqrt"Sqrt ./blocks.3/self_attn/k_norm/Constant_2_output_0%/blocks.3/self_attn/k_norm/Constant_2"Constant*G value*;B1/blocks.3/self_attn/k_norm/Constant_2_attr::valueJ?  ./blocks.3/self_attn/k_norm/Constant_2_output_0 (/blocks.3/self_attn/k_norm/Sqrt_output_0'/blocks.3/self_attn/k_norm/Div_output_0/blocks.3/self_attn/k_norm/Div"Div  (/blocks.3/self_attn/k_norm/Cast_output_0*/blocks.3/self_attn/k_norm/Cast_1_output_0!/blocks.3/self_attn/k_norm/Cast_1"Cast* to  */blocks.3/self_attn/k_norm/Cast_1_output_0 '/blocks.3/self_attn/k_norm/Div_output_0'/blocks.3/self_attn/k_norm/Mul_output_0/blocks.3/self_attn/k_norm/Mul"Mul  '/blocks.3/self_attn/k_norm/Mul_output_0 blocks.3.self_attn.k_norm.weight)/blocks.3/self_attn/k_norm/Mul_1_output_0 /blocks.3/self_attn/k_norm/Mul_1"Mul  )/blocks.3/self_attn/k_norm/Mul_1_output_0*/blocks.3/self_attn/k_norm/Cast_2_output_0!/blocks.3/self_attn/k_norm/Cast_2"Cast* to  */blocks.3/self_attn/q_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0 /blocks.3/self_attn/Mul_output_0/blocks.3/self_attn/Mul"Mul v */blocks.3/self_attn/q_norm/Cast_2_output_0$/blocks.3/self_attn/Shape_2_output_0/blocks.3/self_attn/Shape_2"Shape '/blocks.3/self_attn/Constant_8_output_0/blocks.3/self_attn/Constant_8"Constant*D value*8B*/blocks.3/self_attn/Constant_8_attr::valueJ  $/blocks.3/self_attn/Shape_2_output_0 '/blocks.3/self_attn/Constant_8_output_0%/blocks.3/self_attn/Gather_2_output_0/blocks.3/self_attn/Gather_2"Gather* axis '/blocks.3/self_attn/Constant_9_output_0/blocks.3/self_attn/Constant_9"Constant*D value*8B*/blocks.3/self_attn/Constant_9_attr::valueJ  %/blocks.3/self_attn/Gather_2_output_0 '/blocks.3/self_attn/Constant_9_output_0 /blocks.3/self_attn/Div_output_0/blocks.3/self_attn/Div"Div p /blocks.3/self_attn/Div_output_0!/blocks.3/self_attn/Cast_output_0/blocks.3/self_attn/Cast"Cast* to u !/blocks.3/self_attn/Cast_output_0#/blocks.3/self_attn/Cast_1_output_0/blocks.3/self_attn/Cast_1"Cast* to (/blocks.3/self_attn/Constant_10_output_0/blocks.3/self_attn/Constant_10"Constant*G value*;B+/blocks.3/self_attn/Constant_10_attr::valueJ (/blocks.3/self_attn/Constant_11_output_0/blocks.3/self_attn/Constant_11"Constant*G value*;B+/blocks.3/self_attn/Constant_11_attr::valueJ (/blocks.3/self_attn/Constant_12_output_0/blocks.3/self_attn/Constant_12"Constant*G value*;B+/blocks.3/self_attn/Constant_12_attr::valueJ  #/blocks.3/self_attn/Cast_1_output_0 (/blocks.3/self_attn/Constant_12_output_0(/blocks.3/self_attn/Unsqueeze_6_output_0/blocks.3/self_attn/Unsqueeze_6" Unsqueeze (/blocks.3/self_attn/Constant_13_output_0/blocks.3/self_attn/Constant_13"Constant*G value*;B+/blocks.3/self_attn/Constant_13_attr::valueJ  */blocks.3/self_attn/q_norm/Cast_2_output_0 (/blocks.3/self_attn/Constant_11_output_0 (/blocks.3/self_attn/Unsqueeze_6_output_0 (/blocks.3/self_attn/Constant_10_output_0 (/blocks.3/self_attn/Constant_13_output_0"/blocks.3/self_attn/Slice_output_0/blocks.3/self_attn/Slice"Slice (/blocks.3/self_attn/Constant_14_output_0/blocks.3/self_attn/Constant_14"Constant*G value*;B+/blocks.3/self_attn/Constant_14_attr::valueJ (/blocks.3/self_attn/Constant_15_output_0/blocks.3/self_attn/Constant_15"Constant*G value*;B+/blocks.3/self_attn/Constant_15_attr::valueJ  #/blocks.3/self_attn/Cast_1_output_0 (/blocks.3/self_attn/Constant_15_output_0(/blocks.3/self_attn/Unsqueeze_7_output_0/blocks.3/self_attn/Unsqueeze_7" Unsqueeze (/blocks.3/self_attn/Constant_16_output_0/blocks.3/self_attn/Constant_16"Constant*G value*;B+/blocks.3/self_attn/Constant_16_attr::valueJ (/blocks.3/self_attn/Constant_17_output_0/blocks.3/self_attn/Constant_17"Constant*G value*;B+/blocks.3/self_attn/Constant_17_attr::valueJ  */blocks.3/self_attn/q_norm/Cast_2_output_0 (/blocks.3/self_attn/Unsqueeze_7_output_0 (/blocks.3/self_attn/Constant_16_output_0 (/blocks.3/self_attn/Constant_14_output_0 (/blocks.3/self_attn/Constant_17_output_0$/blocks.3/self_attn/Slice_1_output_0/blocks.3/self_attn/Slice_1"Slice f $/blocks.3/self_attn/Slice_1_output_0 /blocks.3/self_attn/Neg_output_0/blocks.3/self_attn/Neg"Neg  /blocks.3/self_attn/Neg_output_0 "/blocks.3/self_attn/Slice_output_0%/blocks.3/self_attn/Concat_3_output_0/blocks.3/self_attn/Concat_3"Concat* axis  %/blocks.3/self_attn/Concat_3_output_0 %/blocks.0/self_attn/Gather_3_output_0"/blocks.3/self_attn/Mul_1_output_0/blocks.3/self_attn/Mul_1"Mul  /blocks.3/self_attn/Mul_output_0 "/blocks.3/self_attn/Mul_1_output_0 /blocks.3/self_attn/Add_output_0/blocks.3/self_attn/Add"Add  */blocks.3/self_attn/k_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0"/blocks.3/self_attn/Mul_2_output_0/blocks.3/self_attn/Mul_2"Mul v */blocks.3/self_attn/k_norm/Cast_2_output_0$/blocks.3/self_attn/Shape_3_output_0/blocks.3/self_attn/Shape_3"Shape (/blocks.3/self_attn/Constant_18_output_0/blocks.3/self_attn/Constant_18"Constant*E value*9B+/blocks.3/self_attn/Constant_18_attr::valueJ  $/blocks.3/self_attn/Shape_3_output_0 (/blocks.3/self_attn/Constant_18_output_0%/blocks.3/self_attn/Gather_3_output_0/blocks.3/self_attn/Gather_3"Gather* axis (/blocks.3/self_attn/Constant_19_output_0/blocks.3/self_attn/Constant_19"Constant*E value*9B+/blocks.3/self_attn/Constant_19_attr::valueJ  %/blocks.3/self_attn/Gather_3_output_0 (/blocks.3/self_attn/Constant_19_output_0"/blocks.3/self_attn/Div_1_output_0/blocks.3/self_attn/Div_1"Div v "/blocks.3/self_attn/Div_1_output_0#/blocks.3/self_attn/Cast_2_output_0/blocks.3/self_attn/Cast_2"Cast* to w #/blocks.3/self_attn/Cast_2_output_0#/blocks.3/self_attn/Cast_3_output_0/blocks.3/self_attn/Cast_3"Cast* to (/blocks.3/self_attn/Constant_20_output_0/blocks.3/self_attn/Constant_20"Constant*G value*;B+/blocks.3/self_attn/Constant_20_attr::valueJ (/blocks.3/self_attn/Constant_21_output_0/blocks.3/self_attn/Constant_21"Constant*G value*;B+/blocks.3/self_attn/Constant_21_attr::valueJ (/blocks.3/self_attn/Constant_22_output_0/blocks.3/self_attn/Constant_22"Constant*G value*;B+/blocks.3/self_attn/Constant_22_attr::valueJ  #/blocks.3/self_attn/Cast_3_output_0 (/blocks.3/self_attn/Constant_22_output_0(/blocks.3/self_attn/Unsqueeze_8_output_0/blocks.3/self_attn/Unsqueeze_8" Unsqueeze (/blocks.3/self_attn/Constant_23_output_0/blocks.3/self_attn/Constant_23"Constant*G value*;B+/blocks.3/self_attn/Constant_23_attr::valueJ  */blocks.3/self_attn/k_norm/Cast_2_output_0 (/blocks.3/self_attn/Constant_21_output_0 (/blocks.3/self_attn/Unsqueeze_8_output_0 (/blocks.3/self_attn/Constant_20_output_0 (/blocks.3/self_attn/Constant_23_output_0$/blocks.3/self_attn/Slice_2_output_0/blocks.3/self_attn/Slice_2"Slice (/blocks.3/self_attn/Constant_24_output_0/blocks.3/self_attn/Constant_24"Constant*G value*;B+/blocks.3/self_attn/Constant_24_attr::valueJ (/blocks.3/self_attn/Constant_25_output_0/blocks.3/self_attn/Constant_25"Constant*G value*;B+/blocks.3/self_attn/Constant_25_attr::valueJ  #/blocks.3/self_attn/Cast_3_output_0 (/blocks.3/self_attn/Constant_25_output_0(/blocks.3/self_attn/Unsqueeze_9_output_0/blocks.3/self_attn/Unsqueeze_9" Unsqueeze (/blocks.3/self_attn/Constant_26_output_0/blocks.3/self_attn/Constant_26"Constant*G value*;B+/blocks.3/self_attn/Constant_26_attr::valueJ (/blocks.3/self_attn/Constant_27_output_0/blocks.3/self_attn/Constant_27"Constant*G value*;B+/blocks.3/self_attn/Constant_27_attr::valueJ  */blocks.3/self_attn/k_norm/Cast_2_output_0 (/blocks.3/self_attn/Unsqueeze_9_output_0 (/blocks.3/self_attn/Constant_26_output_0 (/blocks.3/self_attn/Constant_24_output_0 (/blocks.3/self_attn/Constant_27_output_0$/blocks.3/self_attn/Slice_3_output_0/blocks.3/self_attn/Slice_3"Slice j $/blocks.3/self_attn/Slice_3_output_0"/blocks.3/self_attn/Neg_1_output_0/blocks.3/self_attn/Neg_1"Neg  "/blocks.3/self_attn/Neg_1_output_0 $/blocks.3/self_attn/Slice_2_output_0%/blocks.3/self_attn/Concat_4_output_0/blocks.3/self_attn/Concat_4"Concat* axis  %/blocks.3/self_attn/Concat_4_output_0 %/blocks.0/self_attn/Gather_3_output_0"/blocks.3/self_attn/Mul_3_output_0/blocks.3/self_attn/Mul_3"Mul  "/blocks.3/self_attn/Mul_2_output_0 "/blocks.3/self_attn/Mul_3_output_0"/blocks.3/self_attn/Add_1_output_0/blocks.3/self_attn/Add_1"Add  /Gather_3_output_0 /rotary/Constant_3_output_0%/blocks.3/self_attn/Gather_4_output_0/blocks.3/self_attn/Gather_4"Gather* axis  /Gather_3_output_0 /rotary/Constant_8_output_0%/blocks.3/self_attn/Gather_5_output_0/blocks.3/self_attn/Gather_5"Gather* axis  %/blocks.3/self_attn/Gather_4_output_0 "/blocks.3/self_attn/Add_1_output_0%/blocks.3/self_attn/Concat_5_output_0/blocks.3/self_attn/Concat_5"Concat* axis  %/blocks.3/self_attn/Gather_5_output_0 &/blocks.3/self_attn/Reshape_2_output_0%/blocks.3/self_attn/Concat_6_output_0/blocks.3/self_attn/Concat_6"Concat* axis (/blocks.3/self_attn/Constant_28_output_0/blocks.3/self_attn/Constant_28"Constant*G value*;B+/blocks.3/self_attn/Constant_28_attr::valueJ  %/blocks.3/self_attn/Concat_5_output_0 (/blocks.3/self_attn/Constant_28_output_0)/blocks.3/self_attn/Unsqueeze_10_output_0 /blocks.3/self_attn/Unsqueeze_10" Unsqueeze (/blocks.3/self_attn/Constant_29_output_0/blocks.3/self_attn/Constant_29"Constant*G value*;B+/blocks.3/self_attn/Constant_29_attr::valueJ  %/blocks.3/self_attn/Concat_6_output_0 (/blocks.3/self_attn/Constant_29_output_0)/blocks.3/self_attn/Unsqueeze_11_output_0 /blocks.3/self_attn/Unsqueeze_11" Unsqueeze  )/blocks.3/self_attn/Unsqueeze_10_output_0 )/blocks.3/self_attn/Unsqueeze_11_output_0%/blocks.3/self_attn/Concat_7_output_0/blocks.3/self_attn/Concat_7"Concat* axis  /blocks.3/self_attn/Add_output_0&/blocks.3/self_attn/Transpose_output_0/blocks.3/self_attn/Transpose" Transpose* perm@@@@  %/blocks.3/self_attn/Concat_5_output_0(/blocks.3/self_attn/Transpose_1_output_0/blocks.3/self_attn/Transpose_1" Transpose* perm@@@@  %/blocks.3/self_attn/Concat_6_output_0(/blocks.3/self_attn/Transpose_2_output_0/blocks.3/self_attn/Transpose_2" Transpose* perm@@@@ t (/blocks.3/self_attn/Transpose_1_output_0$/blocks.3/self_attn/Shape_4_output_0/blocks.3/self_attn/Shape_4"Shape (/blocks.3/self_attn/Constant_30_output_0/blocks.3/self_attn/Constant_30"Constant*E value*9B+/blocks.3/self_attn/Constant_30_attr::valueJ  $/blocks.3/self_attn/Shape_4_output_0 (/blocks.3/self_attn/Constant_30_output_0%/blocks.3/self_attn/Gather_6_output_0/blocks.3/self_attn/Gather_6"Gather* axis t (/blocks.3/self_attn/Transpose_1_output_0$/blocks.3/self_attn/Shape_5_output_0/blocks.3/self_attn/Shape_5"Shape (/blocks.3/self_attn/Constant_31_output_0/blocks.3/self_attn/Constant_31"Constant*E value*9B+/blocks.3/self_attn/Constant_31_attr::valueJ  $/blocks.3/self_attn/Shape_5_output_0 (/blocks.3/self_attn/Constant_31_output_0%/blocks.3/self_attn/Gather_7_output_0/blocks.3/self_attn/Gather_7"Gather* axis t (/blocks.3/self_attn/Transpose_1_output_0$/blocks.3/self_attn/Shape_6_output_0/blocks.3/self_attn/Shape_6"Shape (/blocks.3/self_attn/Constant_32_output_0/blocks.3/self_attn/Constant_32"Constant*E value*9B+/blocks.3/self_attn/Constant_32_attr::valueJ  $/blocks.3/self_attn/Shape_6_output_0 (/blocks.3/self_attn/Constant_32_output_0%/blocks.3/self_attn/Gather_8_output_0/blocks.3/self_attn/Gather_8"Gather* axis t (/blocks.3/self_attn/Transpose_1_output_0$/blocks.3/self_attn/Shape_7_output_0/blocks.3/self_attn/Shape_7"Shape (/blocks.3/self_attn/Constant_33_output_0/blocks.3/self_attn/Constant_33"Constant*E value*9B+/blocks.3/self_attn/Constant_33_attr::valueJ  $/blocks.3/self_attn/Shape_7_output_0 (/blocks.3/self_attn/Constant_33_output_0%/blocks.3/self_attn/Gather_9_output_0/blocks.3/self_attn/Gather_9"Gather* axis (/blocks.3/self_attn/Constant_34_output_0/blocks.3/self_attn/Constant_34"Constant*G value*;B+/blocks.3/self_attn/Constant_34_attr::valueJ  (/blocks.3/self_attn/Transpose_1_output_0 (/blocks.3/self_attn/Constant_34_output_0)/blocks.3/self_attn/Unsqueeze_12_output_0 /blocks.3/self_attn/Unsqueeze_12" Unsqueeze (/blocks.3/self_attn/Constant_35_output_0/blocks.3/self_attn/Constant_35"Constant*G value*;B+/blocks.3/self_attn/Constant_35_attr::valueJ  %/blocks.3/self_attn/Gather_6_output_0 (/blocks.3/self_attn/Constant_35_output_0)/blocks.3/self_attn/Unsqueeze_13_output_0 /blocks.3/self_attn/Unsqueeze_13" Unsqueeze (/blocks.3/self_attn/Constant_36_output_0/blocks.3/self_attn/Constant_36"Constant*G value*;B+/blocks.3/self_attn/Constant_36_attr::valueJ  %/blocks.3/self_attn/Gather_7_output_0 (/blocks.3/self_attn/Constant_36_output_0)/blocks.3/self_attn/Unsqueeze_14_output_0 /blocks.3/self_attn/Unsqueeze_14" Unsqueeze (/blocks.3/self_attn/Constant_37_output_0/blocks.3/self_attn/Constant_37"Constant*G value*;B+/blocks.3/self_attn/Constant_37_attr::valueJ (/blocks.3/self_attn/Constant_38_output_0/blocks.3/self_attn/Constant_38"Constant*G value*;B+/blocks.3/self_attn/Constant_38_attr::valueJ  %/blocks.3/self_attn/Gather_8_output_0 (/blocks.3/self_attn/Constant_38_output_0)/blocks.3/self_attn/Unsqueeze_15_output_0 /blocks.3/self_attn/Unsqueeze_15" Unsqueeze (/blocks.3/self_attn/Constant_39_output_0/blocks.3/self_attn/Constant_39"Constant*G value*;B+/blocks.3/self_attn/Constant_39_attr::valueJ  %/blocks.3/self_attn/Gather_9_output_0 (/blocks.3/self_attn/Constant_39_output_0)/blocks.3/self_attn/Unsqueeze_16_output_0 /blocks.3/self_attn/Unsqueeze_16" Unsqueeze  )/blocks.3/self_attn/Unsqueeze_13_output_0 )/blocks.3/self_attn/Unsqueeze_14_output_0 (/blocks.3/self_attn/Constant_37_output_0 )/blocks.3/self_attn/Unsqueeze_15_output_0 )/blocks.3/self_attn/Unsqueeze_16_output_0%/blocks.3/self_attn/Concat_8_output_0/blocks.3/self_attn/Concat_8"Concat* axis (/blocks.3/self_attn/Constant_40_output_0/blocks.3/self_attn/Constant_40"Constant*G value*;B+/blocks.3/self_attn/Constant_40_attr::valueJ  %/blocks.3/self_attn/Concat_8_output_0 (/blocks.3/self_attn/Constant_40_output_0&/blocks.3/self_attn/Reshape_3_output_0/blocks.3/self_attn/Reshape_3"Reshape* allowzero r &/blocks.3/self_attn/Reshape_3_output_0$/blocks.3/self_attn/Shape_8_output_0/blocks.3/self_attn/Shape_8"Shape  $/blocks.3/self_attn/Shape_8_output_0,/blocks.3/self_attn/ConstantOfShape_output_0#/blocks.3/self_attn/ConstantOfShape"ConstantOfShape*K value*?B//blocks.3/self_attn/ConstantOfShape_attr::valueJ (/blocks.3/self_attn/Constant_41_output_0/blocks.3/self_attn/Constant_41"Constant*E value*9B+/blocks.3/self_attn/Constant_41_attr::valueJ  ,/blocks.3/self_attn/ConstantOfShape_output_0 (/blocks.3/self_attn/Constant_41_output_0"/blocks.3/self_attn/Mul_4_output_0/blocks.3/self_attn/Mul_4"Mul  &/blocks.3/self_attn/Reshape_3_output_0 "/blocks.3/self_attn/Mul_4_output_0"/blocks.3/self_attn/Equal_output_0/blocks.3/self_attn/Equal"Equal  "/blocks.3/self_attn/Equal_output_0 ,/blocks.3/self_attn/ConstantOfShape_output_0 &/blocks.3/self_attn/Reshape_3_output_0"/blocks.3/self_attn/Where_output_0/blocks.3/self_attn/Where"Where  )/blocks.3/self_attn/Unsqueeze_12_output_0 "/blocks.3/self_attn/Where_output_0#/blocks.3/self_attn/Expand_output_0/blocks.3/self_attn/Expand"Expand (/blocks.3/self_attn/Constant_42_output_0/blocks.3/self_attn/Constant_42"Constant*E value*9B+/blocks.3/self_attn/Constant_42_attr::valueJ  %/blocks.3/self_attn/Gather_7_output_0 (/blocks.3/self_attn/Constant_42_output_0"/blocks.3/self_attn/Mul_5_output_0/blocks.3/self_attn/Mul_5"Mul fonnx::Unsqueeze_1408 Constant_3487"Constant*5 value*)BConstant_3487_attr::valueJ  %/blocks.3/self_attn/Gather_6_output_0 onnx::Unsqueeze_1408)/blocks.3/self_attn/Unsqueeze_17_output_0 /blocks.3/self_attn/Unsqueeze_17" Unsqueeze fonnx::Unsqueeze_1410 Constant_3489"Constant*5 value*)BConstant_3489_attr::valueJ  "/blocks.3/self_attn/Mul_5_output_0 onnx::Unsqueeze_1410)/blocks.3/self_attn/Unsqueeze_18_output_0 /blocks.3/self_attn/Unsqueeze_18" Unsqueeze fonnx::Unsqueeze_1412 Constant_3491"Constant*5 value*)BConstant_3491_attr::valueJ  %/blocks.3/self_attn/Gather_8_output_0 onnx::Unsqueeze_1412)/blocks.3/self_attn/Unsqueeze_19_output_0 /blocks.3/self_attn/Unsqueeze_19" Unsqueeze fonnx::Unsqueeze_1414 Constant_3493"Constant*5 value*)BConstant_3493_attr::valueJ  %/blocks.3/self_attn/Gather_9_output_0 onnx::Unsqueeze_1414)/blocks.3/self_attn/Unsqueeze_20_output_0 /blocks.3/self_attn/Unsqueeze_20" Unsqueeze  )/blocks.3/self_attn/Unsqueeze_17_output_0 )/blocks.3/self_attn/Unsqueeze_18_output_0 )/blocks.3/self_attn/Unsqueeze_19_output_0 )/blocks.3/self_attn/Unsqueeze_20_output_0%/blocks.3/self_attn/Concat_9_output_0/blocks.3/self_attn/Concat_9"Concat* axis  #/blocks.3/self_attn/Expand_output_0 %/blocks.3/self_attn/Concat_9_output_0&/blocks.3/self_attn/Reshape_4_output_0/blocks.3/self_attn/Reshape_4"Reshape* allowzero t (/blocks.3/self_attn/Transpose_2_output_0$/blocks.3/self_attn/Shape_9_output_0/blocks.3/self_attn/Shape_9"Shape (/blocks.3/self_attn/Constant_43_output_0/blocks.3/self_attn/Constant_43"Constant*E value*9B+/blocks.3/self_attn/Constant_43_attr::valueJ  $/blocks.3/self_attn/Shape_9_output_0 (/blocks.3/self_attn/Constant_43_output_0&/blocks.3/self_attn/Gather_10_output_0/blocks.3/self_attn/Gather_10"Gather* axis v (/blocks.3/self_attn/Transpose_2_output_0%/blocks.3/self_attn/Shape_10_output_0/blocks.3/self_attn/Shape_10"Shape (/blocks.3/self_attn/Constant_44_output_0/blocks.3/self_attn/Constant_44"Constant*E value*9B+/blocks.3/self_attn/Constant_44_attr::valueJ  %/blocks.3/self_attn/Shape_10_output_0 (/blocks.3/self_attn/Constant_44_output_0&/blocks.3/self_attn/Gather_11_output_0/blocks.3/self_attn/Gather_11"Gather* axis v (/blocks.3/self_attn/Transpose_2_output_0%/blocks.3/self_attn/Shape_11_output_0/blocks.3/self_attn/Shape_11"Shape (/blocks.3/self_attn/Constant_45_output_0/blocks.3/self_attn/Constant_45"Constant*E value*9B+/blocks.3/self_attn/Constant_45_attr::valueJ  %/blocks.3/self_attn/Shape_11_output_0 (/blocks.3/self_attn/Constant_45_output_0&/blocks.3/self_attn/Gather_12_output_0/blocks.3/self_attn/Gather_12"Gather* axis v (/blocks.3/self_attn/Transpose_2_output_0%/blocks.3/self_attn/Shape_12_output_0/blocks.3/self_attn/Shape_12"Shape (/blocks.3/self_attn/Constant_46_output_0/blocks.3/self_attn/Constant_46"Constant*E value*9B+/blocks.3/self_attn/Constant_46_attr::valueJ  %/blocks.3/self_attn/Shape_12_output_0 (/blocks.3/self_attn/Constant_46_output_0&/blocks.3/self_attn/Gather_13_output_0/blocks.3/self_attn/Gather_13"Gather* axis (/blocks.3/self_attn/Constant_47_output_0/blocks.3/self_attn/Constant_47"Constant*G value*;B+/blocks.3/self_attn/Constant_47_attr::valueJ  (/blocks.3/self_attn/Transpose_2_output_0 (/blocks.3/self_attn/Constant_47_output_0)/blocks.3/self_attn/Unsqueeze_21_output_0 /blocks.3/self_attn/Unsqueeze_21" Unsqueeze (/blocks.3/self_attn/Constant_48_output_0/blocks.3/self_attn/Constant_48"Constant*G value*;B+/blocks.3/self_attn/Constant_48_attr::valueJ  &/blocks.3/self_attn/Gather_10_output_0 (/blocks.3/self_attn/Constant_48_output_0)/blocks.3/self_attn/Unsqueeze_22_output_0 /blocks.3/self_attn/Unsqueeze_22" Unsqueeze (/blocks.3/self_attn/Constant_49_output_0/blocks.3/self_attn/Constant_49"Constant*G value*;B+/blocks.3/self_attn/Constant_49_attr::valueJ  &/blocks.3/self_attn/Gather_11_output_0 (/blocks.3/self_attn/Constant_49_output_0)/blocks.3/self_attn/Unsqueeze_23_output_0 /blocks.3/self_attn/Unsqueeze_23" Unsqueeze (/blocks.3/self_attn/Constant_50_output_0/blocks.3/self_attn/Constant_50"Constant*G value*;B+/blocks.3/self_attn/Constant_50_attr::valueJ (/blocks.3/self_attn/Constant_51_output_0/blocks.3/self_attn/Constant_51"Constant*G value*;B+/blocks.3/self_attn/Constant_51_attr::valueJ  &/blocks.3/self_attn/Gather_12_output_0 (/blocks.3/self_attn/Constant_51_output_0)/blocks.3/self_attn/Unsqueeze_24_output_0 /blocks.3/self_attn/Unsqueeze_24" Unsqueeze (/blocks.3/self_attn/Constant_52_output_0/blocks.3/self_attn/Constant_52"Constant*G value*;B+/blocks.3/self_attn/Constant_52_attr::valueJ  &/blocks.3/self_attn/Gather_13_output_0 (/blocks.3/self_attn/Constant_52_output_0)/blocks.3/self_attn/Unsqueeze_25_output_0 /blocks.3/self_attn/Unsqueeze_25" Unsqueeze  )/blocks.3/self_attn/Unsqueeze_22_output_0 )/blocks.3/self_attn/Unsqueeze_23_output_0 (/blocks.3/self_attn/Constant_50_output_0 )/blocks.3/self_attn/Unsqueeze_24_output_0 )/blocks.3/self_attn/Unsqueeze_25_output_0&/blocks.3/self_attn/Concat_10_output_0/blocks.3/self_attn/Concat_10"Concat* axis (/blocks.3/self_attn/Constant_53_output_0/blocks.3/self_attn/Constant_53"Constant*G value*;B+/blocks.3/self_attn/Constant_53_attr::valueJ  &/blocks.3/self_attn/Concat_10_output_0 (/blocks.3/self_attn/Constant_53_output_0&/blocks.3/self_attn/Reshape_5_output_0/blocks.3/self_attn/Reshape_5"Reshape* allowzero t &/blocks.3/self_attn/Reshape_5_output_0%/blocks.3/self_attn/Shape_13_output_0/blocks.3/self_attn/Shape_13"Shape  %/blocks.3/self_attn/Shape_13_output_0./blocks.3/self_attn/ConstantOfShape_1_output_0%/blocks.3/self_attn/ConstantOfShape_1"ConstantOfShape*M value*AB1/blocks.3/self_attn/ConstantOfShape_1_attr::valueJ (/blocks.3/self_attn/Constant_54_output_0/blocks.3/self_attn/Constant_54"Constant*E value*9B+/blocks.3/self_attn/Constant_54_attr::valueJ  ./blocks.3/self_attn/ConstantOfShape_1_output_0 (/blocks.3/self_attn/Constant_54_output_0"/blocks.3/self_attn/Mul_6_output_0/blocks.3/self_attn/Mul_6"Mul  &/blocks.3/self_attn/Reshape_5_output_0 "/blocks.3/self_attn/Mul_6_output_0$/blocks.3/self_attn/Equal_1_output_0/blocks.3/self_attn/Equal_1"Equal  $/blocks.3/self_attn/Equal_1_output_0 ./blocks.3/self_attn/ConstantOfShape_1_output_0 &/blocks.3/self_attn/Reshape_5_output_0$/blocks.3/self_attn/Where_1_output_0/blocks.3/self_attn/Where_1"Where  )/blocks.3/self_attn/Unsqueeze_21_output_0 $/blocks.3/self_attn/Where_1_output_0%/blocks.3/self_attn/Expand_1_output_0/blocks.3/self_attn/Expand_1"Expand (/blocks.3/self_attn/Constant_55_output_0/blocks.3/self_attn/Constant_55"Constant*E value*9B+/blocks.3/self_attn/Constant_55_attr::valueJ  &/blocks.3/self_attn/Gather_11_output_0 (/blocks.3/self_attn/Constant_55_output_0"/blocks.3/self_attn/Mul_7_output_0/blocks.3/self_attn/Mul_7"Mul fonnx::Unsqueeze_1454 Constant_3532"Constant*5 value*)BConstant_3532_attr::valueJ  &/blocks.3/self_attn/Gather_10_output_0 onnx::Unsqueeze_1454)/blocks.3/self_attn/Unsqueeze_26_output_0 /blocks.3/self_attn/Unsqueeze_26" Unsqueeze fonnx::Unsqueeze_1456 Constant_3534"Constant*5 value*)BConstant_3534_attr::valueJ  "/blocks.3/self_attn/Mul_7_output_0 onnx::Unsqueeze_1456)/blocks.3/self_attn/Unsqueeze_27_output_0 /blocks.3/self_attn/Unsqueeze_27" Unsqueeze fonnx::Unsqueeze_1458 Constant_3536"Constant*5 value*)BConstant_3536_attr::valueJ  &/blocks.3/self_attn/Gather_12_output_0 onnx::Unsqueeze_1458)/blocks.3/self_attn/Unsqueeze_28_output_0 /blocks.3/self_attn/Unsqueeze_28" Unsqueeze fonnx::Unsqueeze_1460 Constant_3538"Constant*5 value*)BConstant_3538_attr::valueJ  &/blocks.3/self_attn/Gather_13_output_0 onnx::Unsqueeze_1460)/blocks.3/self_attn/Unsqueeze_29_output_0 /blocks.3/self_attn/Unsqueeze_29" Unsqueeze  )/blocks.3/self_attn/Unsqueeze_26_output_0 )/blocks.3/self_attn/Unsqueeze_27_output_0 )/blocks.3/self_attn/Unsqueeze_28_output_0 )/blocks.3/self_attn/Unsqueeze_29_output_0&/blocks.3/self_attn/Concat_11_output_0/blocks.3/self_attn/Concat_11"Concat* axis  %/blocks.3/self_attn/Expand_1_output_0 &/blocks.3/self_attn/Concat_11_output_0&/blocks.3/self_attn/Reshape_6_output_0/blocks.3/self_attn/Reshape_6"Reshape* allowzero  &/blocks.3/self_attn/Transpose_output_0 &/blocks.3/self_attn/Reshape_4_output_0#/blocks.3/self_attn/MatMul_output_0/blocks.3/self_attn/MatMul"MatMul (/blocks.3/self_attn/Constant_56_output_0/blocks.3/self_attn/Constant_56"Constant*A value*5B+/blocks.3/self_attn/Constant_56_attr::valueJ5A  #/blocks.3/self_attn/MatMul_output_0 (/blocks.3/self_attn/Constant_56_output_0"/blocks.3/self_attn/Div_2_output_0/blocks.3/self_attn/Div_2"Div x "/blocks.3/self_attn/Div_2_output_0 attention_mask"/blocks.3/self_attn/Add_2_output_0/blocks.3/self_attn/Add_2"Add  "/blocks.3/self_attn/Add_2_output_0$/blocks.3/self_attn/Softmax_output_0/blocks.3/self_attn/Softmax"Softmax* axis x $/blocks.3/self_attn/Softmax_output_0#/blocks.3/self_attn/Cast_4_output_0/blocks.3/self_attn/Cast_4"Cast* to  #/blocks.3/self_attn/Cast_4_output_0 &/blocks.3/self_attn/Reshape_6_output_0%/blocks.3/self_attn/MatMul_1_output_0/blocks.3/self_attn/MatMul_1"MatMul  %/blocks.3/self_attn/MatMul_1_output_0(/blocks.3/self_attn/Transpose_3_output_0/blocks.3/self_attn/Transpose_3" Transpose* perm@@@@ fonnx::Unsqueeze_1472 Constant_3550"Constant*5 value*)BConstant_3550_attr::valueJ  #/blocks.3/self_attn/Gather_output_0 onnx::Unsqueeze_1472)/blocks.3/self_attn/Unsqueeze_30_output_0 /blocks.3/self_attn/Unsqueeze_30" Unsqueeze fonnx::Unsqueeze_1474 Constant_3552"Constant*5 value*)BConstant_3552_attr::valueJ  %/blocks.3/self_attn/Gather_1_output_0 onnx::Unsqueeze_1474)/blocks.3/self_attn/Unsqueeze_31_output_0 /blocks.3/self_attn/Unsqueeze_31" Unsqueeze (/blocks.3/self_attn/Constant_57_output_0/blocks.3/self_attn/Constant_57"Constant*G value*;B+/blocks.3/self_attn/Constant_57_attr::valueJ  )/blocks.3/self_attn/Unsqueeze_30_output_0 )/blocks.3/self_attn/Unsqueeze_31_output_0 (/blocks.3/self_attn/Constant_57_output_0&/blocks.3/self_attn/Concat_12_output_0/blocks.3/self_attn/Concat_12"Concat* axis  (/blocks.3/self_attn/Transpose_3_output_0 &/blocks.3/self_attn/Concat_12_output_0&/blocks.3/self_attn/Reshape_7_output_0/blocks.3/self_attn/Reshape_7"Reshape* allowzero  &/blocks.3/self_attn/Reshape_7_output_0 onnx::MatMul_8673*/blocks.3/self_attn/o_proj/MatMul_output_0!/blocks.3/self_attn/o_proj/MatMul"MatMul  )/blocks.3/input_layernorm/Cast_1_output_0 */blocks.3/self_attn/o_proj/MatMul_output_0/blocks.3/Add_output_0 /blocks.3/Add"Add  /blocks.3/Add_output_00/blocks.3/post_attention_layernorm/Cast_output_0'/blocks.3/post_attention_layernorm/Cast"Cast* to 4/blocks.3/post_attention_layernorm/Constant_output_0+/blocks.3/post_attention_layernorm/Constant"Constant*M value*AB7/blocks.3/post_attention_layernorm/Constant_attr::valueJ@  0/blocks.3/post_attention_layernorm/Cast_output_0 4/blocks.3/post_attention_layernorm/Constant_output_0//blocks.3/post_attention_layernorm/Pow_output_0&/blocks.3/post_attention_layernorm/Pow"Pow  //blocks.3/post_attention_layernorm/Pow_output_06/blocks.3/post_attention_layernorm/ReduceMean_output_0-/blocks.3/post_attention_layernorm/ReduceMean" ReduceMean* axes@* keepdims 6/blocks.3/post_attention_layernorm/Constant_1_output_0-/blocks.3/post_attention_layernorm/Constant_1"Constant*O value*CB9/blocks.3/post_attention_layernorm/Constant_1_attr::valueJ75  6/blocks.3/post_attention_layernorm/ReduceMean_output_0 6/blocks.3/post_attention_layernorm/Constant_1_output_0//blocks.3/post_attention_layernorm/Add_output_0&/blocks.3/post_attention_layernorm/Add"Add  //blocks.3/post_attention_layernorm/Add_output_00/blocks.3/post_attention_layernorm/Sqrt_output_0'/blocks.3/post_attention_layernorm/Sqrt"Sqrt 6/blocks.3/post_attention_layernorm/Constant_2_output_0-/blocks.3/post_attention_layernorm/Constant_2"Constant*O value*CB9/blocks.3/post_attention_layernorm/Constant_2_attr::valueJ?  6/blocks.3/post_attention_layernorm/Constant_2_output_0 0/blocks.3/post_attention_layernorm/Sqrt_output_0//blocks.3/post_attention_layernorm/Div_output_0&/blocks.3/post_attention_layernorm/Div"Div  0/blocks.3/post_attention_layernorm/Cast_output_02/blocks.3/post_attention_layernorm/Cast_1_output_0)/blocks.3/post_attention_layernorm/Cast_1"Cast* to  2/blocks.3/post_attention_layernorm/Cast_1_output_0 //blocks.3/post_attention_layernorm/Div_output_0//blocks.3/post_attention_layernorm/Mul_output_0&/blocks.3/post_attention_layernorm/Mul"Mul  //blocks.3/post_attention_layernorm/Mul_output_0 (blocks.3.post_attention_layernorm.weight1/blocks.3/post_attention_layernorm/Mul_1_output_0(/blocks.3/post_attention_layernorm/Mul_1"Mul  1/blocks.3/post_attention_layernorm/Mul_1_output_02/blocks.3/post_attention_layernorm/Cast_2_output_0)/blocks.3/post_attention_layernorm/Cast_2"Cast* to  2/blocks.3/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_8674'/blocks.3/mlp/gate_proj/MatMul_output_0/blocks.3/mlp/gate_proj/MatMul"MatMul w '/blocks.3/mlp/gate_proj/MatMul_output_0%/blocks.3/mlp/act_fn/Sigmoid_output_0/blocks.3/mlp/act_fn/Sigmoid"Sigmoid  '/blocks.3/mlp/gate_proj/MatMul_output_0 %/blocks.3/mlp/act_fn/Sigmoid_output_0!/blocks.3/mlp/act_fn/Mul_output_0/blocks.3/mlp/act_fn/Mul"Mul  2/blocks.3/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_8675%/blocks.3/mlp/up_proj/MatMul_output_0/blocks.3/mlp/up_proj/MatMul"MatMul ~ !/blocks.3/mlp/act_fn/Mul_output_0 %/blocks.3/mlp/up_proj/MatMul_output_0/blocks.3/mlp/Mul_output_0/blocks.3/mlp/Mul"Mul  /blocks.3/mlp/Mul_output_0 onnx::MatMul_8676'/blocks.3/mlp/down_proj/MatMul_output_0/blocks.3/mlp/down_proj/MatMul"MatMul  2/blocks.3/post_attention_layernorm/Cast_1_output_0 '/blocks.3/mlp/down_proj/MatMul_output_0/blocks.3/Add_1_output_0/blocks.3/Add_1"Add o past_key_values (/blocks.0/self_attn/Constant_38_output_0/Gather_4_output_0 /Gather_4"Gather* axis /blocks.4/Constant_output_0/blocks.4/Constant"Constant*J value*>B/blocks.4/Constant_attr::valueJ  /blocks.3/Add_1_output_0 /blocks.4/Constant_output_0/blocks.4/Reshape_output_0/blocks.4/Reshape"Reshape* allowzero v /blocks.4/Reshape_output_0'/blocks.4/input_layernorm/Cast_output_0/blocks.4/input_layernorm/Cast"Cast* to +/blocks.4/input_layernorm/Constant_output_0"/blocks.4/input_layernorm/Constant"Constant*D value*8B./blocks.4/input_layernorm/Constant_attr::valueJ@  '/blocks.4/input_layernorm/Cast_output_0 +/blocks.4/input_layernorm/Constant_output_0&/blocks.4/input_layernorm/Pow_output_0/blocks.4/input_layernorm/Pow"Pow  &/blocks.4/input_layernorm/Pow_output_0-/blocks.4/input_layernorm/ReduceMean_output_0$/blocks.4/input_layernorm/ReduceMean" ReduceMean* axes@* keepdims -/blocks.4/input_layernorm/Constant_1_output_0$/blocks.4/input_layernorm/Constant_1"Constant*F value*:B0/blocks.4/input_layernorm/Constant_1_attr::valueJ75  -/blocks.4/input_layernorm/ReduceMean_output_0 -/blocks.4/input_layernorm/Constant_1_output_0&/blocks.4/input_layernorm/Add_output_0/blocks.4/input_layernorm/Add"Add w &/blocks.4/input_layernorm/Add_output_0'/blocks.4/input_layernorm/Sqrt_output_0/blocks.4/input_layernorm/Sqrt"Sqrt -/blocks.4/input_layernorm/Constant_2_output_0$/blocks.4/input_layernorm/Constant_2"Constant*F value*:B0/blocks.4/input_layernorm/Constant_2_attr::valueJ?  -/blocks.4/input_layernorm/Constant_2_output_0 '/blocks.4/input_layernorm/Sqrt_output_0&/blocks.4/input_layernorm/Div_output_0/blocks.4/input_layernorm/Div"Div  '/blocks.4/input_layernorm/Cast_output_0)/blocks.4/input_layernorm/Cast_1_output_0 /blocks.4/input_layernorm/Cast_1"Cast* to  )/blocks.4/input_layernorm/Cast_1_output_0 &/blocks.4/input_layernorm/Div_output_0&/blocks.4/input_layernorm/Mul_output_0/blocks.4/input_layernorm/Mul"Mul  &/blocks.4/input_layernorm/Mul_output_0 blocks.4.input_layernorm.weight(/blocks.4/input_layernorm/Mul_1_output_0/blocks.4/input_layernorm/Mul_1"Mul  (/blocks.4/input_layernorm/Mul_1_output_0)/blocks.4/input_layernorm/Cast_2_output_0 /blocks.4/input_layernorm/Cast_2"Cast* to q )/blocks.4/input_layernorm/Cast_2_output_0"/blocks.4/self_attn/Shape_output_0/blocks.4/self_attn/Shape"Shape %/blocks.4/self_attn/Constant_output_0/blocks.4/self_attn/Constant"Constant*B value*6B(/blocks.4/self_attn/Constant_attr::valueJ  "/blocks.4/self_attn/Shape_output_0 %/blocks.4/self_attn/Constant_output_0#/blocks.4/self_attn/Gather_output_0/blocks.4/self_attn/Gather"Gather* axis u )/blocks.4/input_layernorm/Cast_2_output_0$/blocks.4/self_attn/Shape_1_output_0/blocks.4/self_attn/Shape_1"Shape '/blocks.4/self_attn/Constant_1_output_0/blocks.4/self_attn/Constant_1"Constant*D value*8B*/blocks.4/self_attn/Constant_1_attr::valueJ  $/blocks.4/self_attn/Shape_1_output_0 '/blocks.4/self_attn/Constant_1_output_0%/blocks.4/self_attn/Gather_1_output_0/blocks.4/self_attn/Gather_1"Gather* axis  )/blocks.4/input_layernorm/Cast_2_output_0 onnx::MatMul_8677*/blocks.4/self_attn/q_proj/MatMul_output_0!/blocks.4/self_attn/q_proj/MatMul"MatMul  )/blocks.4/input_layernorm/Cast_2_output_0 onnx::MatMul_8678*/blocks.4/self_attn/k_proj/MatMul_output_0!/blocks.4/self_attn/k_proj/MatMul"MatMul  )/blocks.4/input_layernorm/Cast_2_output_0 onnx::MatMul_8679*/blocks.4/self_attn/v_proj/MatMul_output_0!/blocks.4/self_attn/v_proj/MatMul"MatMul fonnx::Unsqueeze_1534 Constant_3604"Constant*5 value*)BConstant_3604_attr::valueJ  #/blocks.4/self_attn/Gather_output_0 onnx::Unsqueeze_1534&/blocks.4/self_attn/Unsqueeze_output_0/blocks.4/self_attn/Unsqueeze" Unsqueeze fonnx::Unsqueeze_1536 Constant_3606"Constant*5 value*)BConstant_3606_attr::valueJ  %/blocks.4/self_attn/Gather_1_output_0 onnx::Unsqueeze_1536(/blocks.4/self_attn/Unsqueeze_1_output_0/blocks.4/self_attn/Unsqueeze_1" Unsqueeze '/blocks.4/self_attn/Constant_2_output_0/blocks.4/self_attn/Constant_2"Constant*F value*:B*/blocks.4/self_attn/Constant_2_attr::valueJ '/blocks.4/self_attn/Constant_3_output_0/blocks.4/self_attn/Constant_3"Constant*F value*:B*/blocks.4/self_attn/Constant_3_attr::valueJ  &/blocks.4/self_attn/Unsqueeze_output_0 (/blocks.4/self_attn/Unsqueeze_1_output_0 '/blocks.4/self_attn/Constant_2_output_0 '/blocks.4/self_attn/Constant_3_output_0#/blocks.4/self_attn/Concat_output_0/blocks.4/self_attn/Concat"Concat* axis  */blocks.4/self_attn/q_proj/MatMul_output_0 #/blocks.4/self_attn/Concat_output_0$/blocks.4/self_attn/Reshape_output_0/blocks.4/self_attn/Reshape"Reshape* allowzero fonnx::Unsqueeze_1544 Constant_3612"Constant*5 value*)BConstant_3612_attr::valueJ  #/blocks.4/self_attn/Gather_output_0 onnx::Unsqueeze_1544(/blocks.4/self_attn/Unsqueeze_2_output_0/blocks.4/self_attn/Unsqueeze_2" Unsqueeze fonnx::Unsqueeze_1546 Constant_3614"Constant*5 value*)BConstant_3614_attr::valueJ  %/blocks.4/self_attn/Gather_1_output_0 onnx::Unsqueeze_1546(/blocks.4/self_attn/Unsqueeze_3_output_0/blocks.4/self_attn/Unsqueeze_3" Unsqueeze '/blocks.4/self_attn/Constant_4_output_0/blocks.4/self_attn/Constant_4"Constant*F value*:B*/blocks.4/self_attn/Constant_4_attr::valueJ '/blocks.4/self_attn/Constant_5_output_0/blocks.4/self_attn/Constant_5"Constant*F value*:B*/blocks.4/self_attn/Constant_5_attr::valueJ  (/blocks.4/self_attn/Unsqueeze_2_output_0 (/blocks.4/self_attn/Unsqueeze_3_output_0 '/blocks.4/self_attn/Constant_4_output_0 '/blocks.4/self_attn/Constant_5_output_0%/blocks.4/self_attn/Concat_1_output_0/blocks.4/self_attn/Concat_1"Concat* axis fonnx::Unsqueeze_1553 Constant_3619"Constant*5 value*)BConstant_3619_attr::valueJ  #/blocks.4/self_attn/Gather_output_0 onnx::Unsqueeze_1553(/blocks.4/self_attn/Unsqueeze_4_output_0/blocks.4/self_attn/Unsqueeze_4" Unsqueeze fonnx::Unsqueeze_1555 Constant_3621"Constant*5 value*)BConstant_3621_attr::valueJ  %/blocks.4/self_attn/Gather_1_output_0 onnx::Unsqueeze_1555(/blocks.4/self_attn/Unsqueeze_5_output_0/blocks.4/self_attn/Unsqueeze_5" Unsqueeze '/blocks.4/self_attn/Constant_6_output_0/blocks.4/self_attn/Constant_6"Constant*F value*:B*/blocks.4/self_attn/Constant_6_attr::valueJ '/blocks.4/self_attn/Constant_7_output_0/blocks.4/self_attn/Constant_7"Constant*F value*:B*/blocks.4/self_attn/Constant_7_attr::valueJ  (/blocks.4/self_attn/Unsqueeze_4_output_0 (/blocks.4/self_attn/Unsqueeze_5_output_0 '/blocks.4/self_attn/Constant_6_output_0 '/blocks.4/self_attn/Constant_7_output_0%/blocks.4/self_attn/Concat_2_output_0/blocks.4/self_attn/Concat_2"Concat* axis  */blocks.4/self_attn/k_proj/MatMul_output_0 %/blocks.4/self_attn/Concat_1_output_0&/blocks.4/self_attn/Reshape_1_output_0/blocks.4/self_attn/Reshape_1"Reshape* allowzero  */blocks.4/self_attn/v_proj/MatMul_output_0 %/blocks.4/self_attn/Concat_2_output_0&/blocks.4/self_attn/Reshape_2_output_0/blocks.4/self_attn/Reshape_2"Reshape* allowzero  $/blocks.4/self_attn/Reshape_output_0(/blocks.4/self_attn/q_norm/Cast_output_0/blocks.4/self_attn/q_norm/Cast"Cast* to ,/blocks.4/self_attn/q_norm/Constant_output_0#/blocks.4/self_attn/q_norm/Constant"Constant*E value*9B//blocks.4/self_attn/q_norm/Constant_attr::valueJ@  (/blocks.4/self_attn/q_norm/Cast_output_0 ,/blocks.4/self_attn/q_norm/Constant_output_0'/blocks.4/self_attn/q_norm/Pow_output_0/blocks.4/self_attn/q_norm/Pow"Pow  '/blocks.4/self_attn/q_norm/Pow_output_0./blocks.4/self_attn/q_norm/ReduceMean_output_0%/blocks.4/self_attn/q_norm/ReduceMean" ReduceMean* axes@* keepdims ./blocks.4/self_attn/q_norm/Constant_1_output_0%/blocks.4/self_attn/q_norm/Constant_1"Constant*G value*;B1/blocks.4/self_attn/q_norm/Constant_1_attr::valueJ75  ./blocks.4/self_attn/q_norm/ReduceMean_output_0 ./blocks.4/self_attn/q_norm/Constant_1_output_0'/blocks.4/self_attn/q_norm/Add_output_0/blocks.4/self_attn/q_norm/Add"Add z '/blocks.4/self_attn/q_norm/Add_output_0(/blocks.4/self_attn/q_norm/Sqrt_output_0/blocks.4/self_attn/q_norm/Sqrt"Sqrt ./blocks.4/self_attn/q_norm/Constant_2_output_0%/blocks.4/self_attn/q_norm/Constant_2"Constant*G value*;B1/blocks.4/self_attn/q_norm/Constant_2_attr::valueJ?  ./blocks.4/self_attn/q_norm/Constant_2_output_0 (/blocks.4/self_attn/q_norm/Sqrt_output_0'/blocks.4/self_attn/q_norm/Div_output_0/blocks.4/self_attn/q_norm/Div"Div  (/blocks.4/self_attn/q_norm/Cast_output_0*/blocks.4/self_attn/q_norm/Cast_1_output_0!/blocks.4/self_attn/q_norm/Cast_1"Cast* to  */blocks.4/self_attn/q_norm/Cast_1_output_0 '/blocks.4/self_attn/q_norm/Div_output_0'/blocks.4/self_attn/q_norm/Mul_output_0/blocks.4/self_attn/q_norm/Mul"Mul  '/blocks.4/self_attn/q_norm/Mul_output_0 blocks.4.self_attn.q_norm.weight)/blocks.4/self_attn/q_norm/Mul_1_output_0 /blocks.4/self_attn/q_norm/Mul_1"Mul  )/blocks.4/self_attn/q_norm/Mul_1_output_0*/blocks.4/self_attn/q_norm/Cast_2_output_0!/blocks.4/self_attn/q_norm/Cast_2"Cast* to  &/blocks.4/self_attn/Reshape_1_output_0(/blocks.4/self_attn/k_norm/Cast_output_0/blocks.4/self_attn/k_norm/Cast"Cast* to ,/blocks.4/self_attn/k_norm/Constant_output_0#/blocks.4/self_attn/k_norm/Constant"Constant*E value*9B//blocks.4/self_attn/k_norm/Constant_attr::valueJ@  (/blocks.4/self_attn/k_norm/Cast_output_0 ,/blocks.4/self_attn/k_norm/Constant_output_0'/blocks.4/self_attn/k_norm/Pow_output_0/blocks.4/self_attn/k_norm/Pow"Pow  '/blocks.4/self_attn/k_norm/Pow_output_0./blocks.4/self_attn/k_norm/ReduceMean_output_0%/blocks.4/self_attn/k_norm/ReduceMean" ReduceMean* axes@* keepdims ./blocks.4/self_attn/k_norm/Constant_1_output_0%/blocks.4/self_attn/k_norm/Constant_1"Constant*G value*;B1/blocks.4/self_attn/k_norm/Constant_1_attr::valueJ75  ./blocks.4/self_attn/k_norm/ReduceMean_output_0 ./blocks.4/self_attn/k_norm/Constant_1_output_0'/blocks.4/self_attn/k_norm/Add_output_0/blocks.4/self_attn/k_norm/Add"Add z '/blocks.4/self_attn/k_norm/Add_output_0(/blocks.4/self_attn/k_norm/Sqrt_output_0/blocks.4/self_attn/k_norm/Sqrt"Sqrt ./blocks.4/self_attn/k_norm/Constant_2_output_0%/blocks.4/self_attn/k_norm/Constant_2"Constant*G value*;B1/blocks.4/self_attn/k_norm/Constant_2_attr::valueJ?  ./blocks.4/self_attn/k_norm/Constant_2_output_0 (/blocks.4/self_attn/k_norm/Sqrt_output_0'/blocks.4/self_attn/k_norm/Div_output_0/blocks.4/self_attn/k_norm/Div"Div  (/blocks.4/self_attn/k_norm/Cast_output_0*/blocks.4/self_attn/k_norm/Cast_1_output_0!/blocks.4/self_attn/k_norm/Cast_1"Cast* to  */blocks.4/self_attn/k_norm/Cast_1_output_0 '/blocks.4/self_attn/k_norm/Div_output_0'/blocks.4/self_attn/k_norm/Mul_output_0/blocks.4/self_attn/k_norm/Mul"Mul  '/blocks.4/self_attn/k_norm/Mul_output_0 blocks.4.self_attn.k_norm.weight)/blocks.4/self_attn/k_norm/Mul_1_output_0 /blocks.4/self_attn/k_norm/Mul_1"Mul  )/blocks.4/self_attn/k_norm/Mul_1_output_0*/blocks.4/self_attn/k_norm/Cast_2_output_0!/blocks.4/self_attn/k_norm/Cast_2"Cast* to  */blocks.4/self_attn/q_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0 /blocks.4/self_attn/Mul_output_0/blocks.4/self_attn/Mul"Mul v */blocks.4/self_attn/q_norm/Cast_2_output_0$/blocks.4/self_attn/Shape_2_output_0/blocks.4/self_attn/Shape_2"Shape '/blocks.4/self_attn/Constant_8_output_0/blocks.4/self_attn/Constant_8"Constant*D value*8B*/blocks.4/self_attn/Constant_8_attr::valueJ  $/blocks.4/self_attn/Shape_2_output_0 '/blocks.4/self_attn/Constant_8_output_0%/blocks.4/self_attn/Gather_2_output_0/blocks.4/self_attn/Gather_2"Gather* axis '/blocks.4/self_attn/Constant_9_output_0/blocks.4/self_attn/Constant_9"Constant*D value*8B*/blocks.4/self_attn/Constant_9_attr::valueJ  %/blocks.4/self_attn/Gather_2_output_0 '/blocks.4/self_attn/Constant_9_output_0 /blocks.4/self_attn/Div_output_0/blocks.4/self_attn/Div"Div p /blocks.4/self_attn/Div_output_0!/blocks.4/self_attn/Cast_output_0/blocks.4/self_attn/Cast"Cast* to u !/blocks.4/self_attn/Cast_output_0#/blocks.4/self_attn/Cast_1_output_0/blocks.4/self_attn/Cast_1"Cast* to (/blocks.4/self_attn/Constant_10_output_0/blocks.4/self_attn/Constant_10"Constant*G value*;B+/blocks.4/self_attn/Constant_10_attr::valueJ (/blocks.4/self_attn/Constant_11_output_0/blocks.4/self_attn/Constant_11"Constant*G value*;B+/blocks.4/self_attn/Constant_11_attr::valueJ (/blocks.4/self_attn/Constant_12_output_0/blocks.4/self_attn/Constant_12"Constant*G value*;B+/blocks.4/self_attn/Constant_12_attr::valueJ  #/blocks.4/self_attn/Cast_1_output_0 (/blocks.4/self_attn/Constant_12_output_0(/blocks.4/self_attn/Unsqueeze_6_output_0/blocks.4/self_attn/Unsqueeze_6" Unsqueeze (/blocks.4/self_attn/Constant_13_output_0/blocks.4/self_attn/Constant_13"Constant*G value*;B+/blocks.4/self_attn/Constant_13_attr::valueJ  */blocks.4/self_attn/q_norm/Cast_2_output_0 (/blocks.4/self_attn/Constant_11_output_0 (/blocks.4/self_attn/Unsqueeze_6_output_0 (/blocks.4/self_attn/Constant_10_output_0 (/blocks.4/self_attn/Constant_13_output_0"/blocks.4/self_attn/Slice_output_0/blocks.4/self_attn/Slice"Slice (/blocks.4/self_attn/Constant_14_output_0/blocks.4/self_attn/Constant_14"Constant*G value*;B+/blocks.4/self_attn/Constant_14_attr::valueJ (/blocks.4/self_attn/Constant_15_output_0/blocks.4/self_attn/Constant_15"Constant*G value*;B+/blocks.4/self_attn/Constant_15_attr::valueJ  #/blocks.4/self_attn/Cast_1_output_0 (/blocks.4/self_attn/Constant_15_output_0(/blocks.4/self_attn/Unsqueeze_7_output_0/blocks.4/self_attn/Unsqueeze_7" Unsqueeze (/blocks.4/self_attn/Constant_16_output_0/blocks.4/self_attn/Constant_16"Constant*G value*;B+/blocks.4/self_attn/Constant_16_attr::valueJ (/blocks.4/self_attn/Constant_17_output_0/blocks.4/self_attn/Constant_17"Constant*G value*;B+/blocks.4/self_attn/Constant_17_attr::valueJ  */blocks.4/self_attn/q_norm/Cast_2_output_0 (/blocks.4/self_attn/Unsqueeze_7_output_0 (/blocks.4/self_attn/Constant_16_output_0 (/blocks.4/self_attn/Constant_14_output_0 (/blocks.4/self_attn/Constant_17_output_0$/blocks.4/self_attn/Slice_1_output_0/blocks.4/self_attn/Slice_1"Slice f $/blocks.4/self_attn/Slice_1_output_0 /blocks.4/self_attn/Neg_output_0/blocks.4/self_attn/Neg"Neg  /blocks.4/self_attn/Neg_output_0 "/blocks.4/self_attn/Slice_output_0%/blocks.4/self_attn/Concat_3_output_0/blocks.4/self_attn/Concat_3"Concat* axis  %/blocks.4/self_attn/Concat_3_output_0 %/blocks.0/self_attn/Gather_3_output_0"/blocks.4/self_attn/Mul_1_output_0/blocks.4/self_attn/Mul_1"Mul  /blocks.4/self_attn/Mul_output_0 "/blocks.4/self_attn/Mul_1_output_0 /blocks.4/self_attn/Add_output_0/blocks.4/self_attn/Add"Add  */blocks.4/self_attn/k_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0"/blocks.4/self_attn/Mul_2_output_0/blocks.4/self_attn/Mul_2"Mul v */blocks.4/self_attn/k_norm/Cast_2_output_0$/blocks.4/self_attn/Shape_3_output_0/blocks.4/self_attn/Shape_3"Shape (/blocks.4/self_attn/Constant_18_output_0/blocks.4/self_attn/Constant_18"Constant*E value*9B+/blocks.4/self_attn/Constant_18_attr::valueJ  $/blocks.4/self_attn/Shape_3_output_0 (/blocks.4/self_attn/Constant_18_output_0%/blocks.4/self_attn/Gather_3_output_0/blocks.4/self_attn/Gather_3"Gather* axis (/blocks.4/self_attn/Constant_19_output_0/blocks.4/self_attn/Constant_19"Constant*E value*9B+/blocks.4/self_attn/Constant_19_attr::valueJ  %/blocks.4/self_attn/Gather_3_output_0 (/blocks.4/self_attn/Constant_19_output_0"/blocks.4/self_attn/Div_1_output_0/blocks.4/self_attn/Div_1"Div v "/blocks.4/self_attn/Div_1_output_0#/blocks.4/self_attn/Cast_2_output_0/blocks.4/self_attn/Cast_2"Cast* to w #/blocks.4/self_attn/Cast_2_output_0#/blocks.4/self_attn/Cast_3_output_0/blocks.4/self_attn/Cast_3"Cast* to (/blocks.4/self_attn/Constant_20_output_0/blocks.4/self_attn/Constant_20"Constant*G value*;B+/blocks.4/self_attn/Constant_20_attr::valueJ (/blocks.4/self_attn/Constant_21_output_0/blocks.4/self_attn/Constant_21"Constant*G value*;B+/blocks.4/self_attn/Constant_21_attr::valueJ (/blocks.4/self_attn/Constant_22_output_0/blocks.4/self_attn/Constant_22"Constant*G value*;B+/blocks.4/self_attn/Constant_22_attr::valueJ  #/blocks.4/self_attn/Cast_3_output_0 (/blocks.4/self_attn/Constant_22_output_0(/blocks.4/self_attn/Unsqueeze_8_output_0/blocks.4/self_attn/Unsqueeze_8" Unsqueeze (/blocks.4/self_attn/Constant_23_output_0/blocks.4/self_attn/Constant_23"Constant*G value*;B+/blocks.4/self_attn/Constant_23_attr::valueJ  */blocks.4/self_attn/k_norm/Cast_2_output_0 (/blocks.4/self_attn/Constant_21_output_0 (/blocks.4/self_attn/Unsqueeze_8_output_0 (/blocks.4/self_attn/Constant_20_output_0 (/blocks.4/self_attn/Constant_23_output_0$/blocks.4/self_attn/Slice_2_output_0/blocks.4/self_attn/Slice_2"Slice (/blocks.4/self_attn/Constant_24_output_0/blocks.4/self_attn/Constant_24"Constant*G value*;B+/blocks.4/self_attn/Constant_24_attr::valueJ (/blocks.4/self_attn/Constant_25_output_0/blocks.4/self_attn/Constant_25"Constant*G value*;B+/blocks.4/self_attn/Constant_25_attr::valueJ  #/blocks.4/self_attn/Cast_3_output_0 (/blocks.4/self_attn/Constant_25_output_0(/blocks.4/self_attn/Unsqueeze_9_output_0/blocks.4/self_attn/Unsqueeze_9" Unsqueeze (/blocks.4/self_attn/Constant_26_output_0/blocks.4/self_attn/Constant_26"Constant*G value*;B+/blocks.4/self_attn/Constant_26_attr::valueJ (/blocks.4/self_attn/Constant_27_output_0/blocks.4/self_attn/Constant_27"Constant*G value*;B+/blocks.4/self_attn/Constant_27_attr::valueJ  */blocks.4/self_attn/k_norm/Cast_2_output_0 (/blocks.4/self_attn/Unsqueeze_9_output_0 (/blocks.4/self_attn/Constant_26_output_0 (/blocks.4/self_attn/Constant_24_output_0 (/blocks.4/self_attn/Constant_27_output_0$/blocks.4/self_attn/Slice_3_output_0/blocks.4/self_attn/Slice_3"Slice j $/blocks.4/self_attn/Slice_3_output_0"/blocks.4/self_attn/Neg_1_output_0/blocks.4/self_attn/Neg_1"Neg  "/blocks.4/self_attn/Neg_1_output_0 $/blocks.4/self_attn/Slice_2_output_0%/blocks.4/self_attn/Concat_4_output_0/blocks.4/self_attn/Concat_4"Concat* axis  %/blocks.4/self_attn/Concat_4_output_0 %/blocks.0/self_attn/Gather_3_output_0"/blocks.4/self_attn/Mul_3_output_0/blocks.4/self_attn/Mul_3"Mul  "/blocks.4/self_attn/Mul_2_output_0 "/blocks.4/self_attn/Mul_3_output_0"/blocks.4/self_attn/Add_1_output_0/blocks.4/self_attn/Add_1"Add  /Gather_4_output_0 /rotary/Constant_3_output_0%/blocks.4/self_attn/Gather_4_output_0/blocks.4/self_attn/Gather_4"Gather* axis  /Gather_4_output_0 /rotary/Constant_8_output_0%/blocks.4/self_attn/Gather_5_output_0/blocks.4/self_attn/Gather_5"Gather* axis  %/blocks.4/self_attn/Gather_4_output_0 "/blocks.4/self_attn/Add_1_output_0%/blocks.4/self_attn/Concat_5_output_0/blocks.4/self_attn/Concat_5"Concat* axis  %/blocks.4/self_attn/Gather_5_output_0 &/blocks.4/self_attn/Reshape_2_output_0%/blocks.4/self_attn/Concat_6_output_0/blocks.4/self_attn/Concat_6"Concat* axis (/blocks.4/self_attn/Constant_28_output_0/blocks.4/self_attn/Constant_28"Constant*G value*;B+/blocks.4/self_attn/Constant_28_attr::valueJ  %/blocks.4/self_attn/Concat_5_output_0 (/blocks.4/self_attn/Constant_28_output_0)/blocks.4/self_attn/Unsqueeze_10_output_0 /blocks.4/self_attn/Unsqueeze_10" Unsqueeze (/blocks.4/self_attn/Constant_29_output_0/blocks.4/self_attn/Constant_29"Constant*G value*;B+/blocks.4/self_attn/Constant_29_attr::valueJ  %/blocks.4/self_attn/Concat_6_output_0 (/blocks.4/self_attn/Constant_29_output_0)/blocks.4/self_attn/Unsqueeze_11_output_0 /blocks.4/self_attn/Unsqueeze_11" Unsqueeze  )/blocks.4/self_attn/Unsqueeze_10_output_0 )/blocks.4/self_attn/Unsqueeze_11_output_0%/blocks.4/self_attn/Concat_7_output_0/blocks.4/self_attn/Concat_7"Concat* axis  /blocks.4/self_attn/Add_output_0&/blocks.4/self_attn/Transpose_output_0/blocks.4/self_attn/Transpose" Transpose* perm@@@@  %/blocks.4/self_attn/Concat_5_output_0(/blocks.4/self_attn/Transpose_1_output_0/blocks.4/self_attn/Transpose_1" Transpose* perm@@@@  %/blocks.4/self_attn/Concat_6_output_0(/blocks.4/self_attn/Transpose_2_output_0/blocks.4/self_attn/Transpose_2" Transpose* perm@@@@ t (/blocks.4/self_attn/Transpose_1_output_0$/blocks.4/self_attn/Shape_4_output_0/blocks.4/self_attn/Shape_4"Shape (/blocks.4/self_attn/Constant_30_output_0/blocks.4/self_attn/Constant_30"Constant*E value*9B+/blocks.4/self_attn/Constant_30_attr::valueJ  $/blocks.4/self_attn/Shape_4_output_0 (/blocks.4/self_attn/Constant_30_output_0%/blocks.4/self_attn/Gather_6_output_0/blocks.4/self_attn/Gather_6"Gather* axis t (/blocks.4/self_attn/Transpose_1_output_0$/blocks.4/self_attn/Shape_5_output_0/blocks.4/self_attn/Shape_5"Shape (/blocks.4/self_attn/Constant_31_output_0/blocks.4/self_attn/Constant_31"Constant*E value*9B+/blocks.4/self_attn/Constant_31_attr::valueJ  $/blocks.4/self_attn/Shape_5_output_0 (/blocks.4/self_attn/Constant_31_output_0%/blocks.4/self_attn/Gather_7_output_0/blocks.4/self_attn/Gather_7"Gather* axis t (/blocks.4/self_attn/Transpose_1_output_0$/blocks.4/self_attn/Shape_6_output_0/blocks.4/self_attn/Shape_6"Shape (/blocks.4/self_attn/Constant_32_output_0/blocks.4/self_attn/Constant_32"Constant*E value*9B+/blocks.4/self_attn/Constant_32_attr::valueJ  $/blocks.4/self_attn/Shape_6_output_0 (/blocks.4/self_attn/Constant_32_output_0%/blocks.4/self_attn/Gather_8_output_0/blocks.4/self_attn/Gather_8"Gather* axis t (/blocks.4/self_attn/Transpose_1_output_0$/blocks.4/self_attn/Shape_7_output_0/blocks.4/self_attn/Shape_7"Shape (/blocks.4/self_attn/Constant_33_output_0/blocks.4/self_attn/Constant_33"Constant*E value*9B+/blocks.4/self_attn/Constant_33_attr::valueJ  $/blocks.4/self_attn/Shape_7_output_0 (/blocks.4/self_attn/Constant_33_output_0%/blocks.4/self_attn/Gather_9_output_0/blocks.4/self_attn/Gather_9"Gather* axis (/blocks.4/self_attn/Constant_34_output_0/blocks.4/self_attn/Constant_34"Constant*G value*;B+/blocks.4/self_attn/Constant_34_attr::valueJ  (/blocks.4/self_attn/Transpose_1_output_0 (/blocks.4/self_attn/Constant_34_output_0)/blocks.4/self_attn/Unsqueeze_12_output_0 /blocks.4/self_attn/Unsqueeze_12" Unsqueeze (/blocks.4/self_attn/Constant_35_output_0/blocks.4/self_attn/Constant_35"Constant*G value*;B+/blocks.4/self_attn/Constant_35_attr::valueJ  %/blocks.4/self_attn/Gather_6_output_0 (/blocks.4/self_attn/Constant_35_output_0)/blocks.4/self_attn/Unsqueeze_13_output_0 /blocks.4/self_attn/Unsqueeze_13" Unsqueeze (/blocks.4/self_attn/Constant_36_output_0/blocks.4/self_attn/Constant_36"Constant*G value*;B+/blocks.4/self_attn/Constant_36_attr::valueJ  %/blocks.4/self_attn/Gather_7_output_0 (/blocks.4/self_attn/Constant_36_output_0)/blocks.4/self_attn/Unsqueeze_14_output_0 /blocks.4/self_attn/Unsqueeze_14" Unsqueeze (/blocks.4/self_attn/Constant_37_output_0/blocks.4/self_attn/Constant_37"Constant*G value*;B+/blocks.4/self_attn/Constant_37_attr::valueJ (/blocks.4/self_attn/Constant_38_output_0/blocks.4/self_attn/Constant_38"Constant*G value*;B+/blocks.4/self_attn/Constant_38_attr::valueJ  %/blocks.4/self_attn/Gather_8_output_0 (/blocks.4/self_attn/Constant_38_output_0)/blocks.4/self_attn/Unsqueeze_15_output_0 /blocks.4/self_attn/Unsqueeze_15" Unsqueeze (/blocks.4/self_attn/Constant_39_output_0/blocks.4/self_attn/Constant_39"Constant*G value*;B+/blocks.4/self_attn/Constant_39_attr::valueJ  %/blocks.4/self_attn/Gather_9_output_0 (/blocks.4/self_attn/Constant_39_output_0)/blocks.4/self_attn/Unsqueeze_16_output_0 /blocks.4/self_attn/Unsqueeze_16" Unsqueeze  )/blocks.4/self_attn/Unsqueeze_13_output_0 )/blocks.4/self_attn/Unsqueeze_14_output_0 (/blocks.4/self_attn/Constant_37_output_0 )/blocks.4/self_attn/Unsqueeze_15_output_0 )/blocks.4/self_attn/Unsqueeze_16_output_0%/blocks.4/self_attn/Concat_8_output_0/blocks.4/self_attn/Concat_8"Concat* axis (/blocks.4/self_attn/Constant_40_output_0/blocks.4/self_attn/Constant_40"Constant*G value*;B+/blocks.4/self_attn/Constant_40_attr::valueJ  %/blocks.4/self_attn/Concat_8_output_0 (/blocks.4/self_attn/Constant_40_output_0&/blocks.4/self_attn/Reshape_3_output_0/blocks.4/self_attn/Reshape_3"Reshape* allowzero r &/blocks.4/self_attn/Reshape_3_output_0$/blocks.4/self_attn/Shape_8_output_0/blocks.4/self_attn/Shape_8"Shape  $/blocks.4/self_attn/Shape_8_output_0,/blocks.4/self_attn/ConstantOfShape_output_0#/blocks.4/self_attn/ConstantOfShape"ConstantOfShape*K value*?B//blocks.4/self_attn/ConstantOfShape_attr::valueJ (/blocks.4/self_attn/Constant_41_output_0/blocks.4/self_attn/Constant_41"Constant*E value*9B+/blocks.4/self_attn/Constant_41_attr::valueJ  ,/blocks.4/self_attn/ConstantOfShape_output_0 (/blocks.4/self_attn/Constant_41_output_0"/blocks.4/self_attn/Mul_4_output_0/blocks.4/self_attn/Mul_4"Mul  &/blocks.4/self_attn/Reshape_3_output_0 "/blocks.4/self_attn/Mul_4_output_0"/blocks.4/self_attn/Equal_output_0/blocks.4/self_attn/Equal"Equal  "/blocks.4/self_attn/Equal_output_0 ,/blocks.4/self_attn/ConstantOfShape_output_0 &/blocks.4/self_attn/Reshape_3_output_0"/blocks.4/self_attn/Where_output_0/blocks.4/self_attn/Where"Where  )/blocks.4/self_attn/Unsqueeze_12_output_0 "/blocks.4/self_attn/Where_output_0#/blocks.4/self_attn/Expand_output_0/blocks.4/self_attn/Expand"Expand (/blocks.4/self_attn/Constant_42_output_0/blocks.4/self_attn/Constant_42"Constant*E value*9B+/blocks.4/self_attn/Constant_42_attr::valueJ  %/blocks.4/self_attn/Gather_7_output_0 (/blocks.4/self_attn/Constant_42_output_0"/blocks.4/self_attn/Mul_5_output_0/blocks.4/self_attn/Mul_5"Mul fonnx::Unsqueeze_1698 Constant_3749"Constant*5 value*)BConstant_3749_attr::valueJ  %/blocks.4/self_attn/Gather_6_output_0 onnx::Unsqueeze_1698)/blocks.4/self_attn/Unsqueeze_17_output_0 /blocks.4/self_attn/Unsqueeze_17" Unsqueeze fonnx::Unsqueeze_1700 Constant_3751"Constant*5 value*)BConstant_3751_attr::valueJ  "/blocks.4/self_attn/Mul_5_output_0 onnx::Unsqueeze_1700)/blocks.4/self_attn/Unsqueeze_18_output_0 /blocks.4/self_attn/Unsqueeze_18" Unsqueeze fonnx::Unsqueeze_1702 Constant_3753"Constant*5 value*)BConstant_3753_attr::valueJ  %/blocks.4/self_attn/Gather_8_output_0 onnx::Unsqueeze_1702)/blocks.4/self_attn/Unsqueeze_19_output_0 /blocks.4/self_attn/Unsqueeze_19" Unsqueeze fonnx::Unsqueeze_1704 Constant_3755"Constant*5 value*)BConstant_3755_attr::valueJ  %/blocks.4/self_attn/Gather_9_output_0 onnx::Unsqueeze_1704)/blocks.4/self_attn/Unsqueeze_20_output_0 /blocks.4/self_attn/Unsqueeze_20" Unsqueeze  )/blocks.4/self_attn/Unsqueeze_17_output_0 )/blocks.4/self_attn/Unsqueeze_18_output_0 )/blocks.4/self_attn/Unsqueeze_19_output_0 )/blocks.4/self_attn/Unsqueeze_20_output_0%/blocks.4/self_attn/Concat_9_output_0/blocks.4/self_attn/Concat_9"Concat* axis  #/blocks.4/self_attn/Expand_output_0 %/blocks.4/self_attn/Concat_9_output_0&/blocks.4/self_attn/Reshape_4_output_0/blocks.4/self_attn/Reshape_4"Reshape* allowzero t (/blocks.4/self_attn/Transpose_2_output_0$/blocks.4/self_attn/Shape_9_output_0/blocks.4/self_attn/Shape_9"Shape (/blocks.4/self_attn/Constant_43_output_0/blocks.4/self_attn/Constant_43"Constant*E value*9B+/blocks.4/self_attn/Constant_43_attr::valueJ  $/blocks.4/self_attn/Shape_9_output_0 (/blocks.4/self_attn/Constant_43_output_0&/blocks.4/self_attn/Gather_10_output_0/blocks.4/self_attn/Gather_10"Gather* axis v (/blocks.4/self_attn/Transpose_2_output_0%/blocks.4/self_attn/Shape_10_output_0/blocks.4/self_attn/Shape_10"Shape (/blocks.4/self_attn/Constant_44_output_0/blocks.4/self_attn/Constant_44"Constant*E value*9B+/blocks.4/self_attn/Constant_44_attr::valueJ  %/blocks.4/self_attn/Shape_10_output_0 (/blocks.4/self_attn/Constant_44_output_0&/blocks.4/self_attn/Gather_11_output_0/blocks.4/self_attn/Gather_11"Gather* axis v (/blocks.4/self_attn/Transpose_2_output_0%/blocks.4/self_attn/Shape_11_output_0/blocks.4/self_attn/Shape_11"Shape (/blocks.4/self_attn/Constant_45_output_0/blocks.4/self_attn/Constant_45"Constant*E value*9B+/blocks.4/self_attn/Constant_45_attr::valueJ  %/blocks.4/self_attn/Shape_11_output_0 (/blocks.4/self_attn/Constant_45_output_0&/blocks.4/self_attn/Gather_12_output_0/blocks.4/self_attn/Gather_12"Gather* axis v (/blocks.4/self_attn/Transpose_2_output_0%/blocks.4/self_attn/Shape_12_output_0/blocks.4/self_attn/Shape_12"Shape (/blocks.4/self_attn/Constant_46_output_0/blocks.4/self_attn/Constant_46"Constant*E value*9B+/blocks.4/self_attn/Constant_46_attr::valueJ  %/blocks.4/self_attn/Shape_12_output_0 (/blocks.4/self_attn/Constant_46_output_0&/blocks.4/self_attn/Gather_13_output_0/blocks.4/self_attn/Gather_13"Gather* axis (/blocks.4/self_attn/Constant_47_output_0/blocks.4/self_attn/Constant_47"Constant*G value*;B+/blocks.4/self_attn/Constant_47_attr::valueJ  (/blocks.4/self_attn/Transpose_2_output_0 (/blocks.4/self_attn/Constant_47_output_0)/blocks.4/self_attn/Unsqueeze_21_output_0 /blocks.4/self_attn/Unsqueeze_21" Unsqueeze (/blocks.4/self_attn/Constant_48_output_0/blocks.4/self_attn/Constant_48"Constant*G value*;B+/blocks.4/self_attn/Constant_48_attr::valueJ  &/blocks.4/self_attn/Gather_10_output_0 (/blocks.4/self_attn/Constant_48_output_0)/blocks.4/self_attn/Unsqueeze_22_output_0 /blocks.4/self_attn/Unsqueeze_22" Unsqueeze (/blocks.4/self_attn/Constant_49_output_0/blocks.4/self_attn/Constant_49"Constant*G value*;B+/blocks.4/self_attn/Constant_49_attr::valueJ  &/blocks.4/self_attn/Gather_11_output_0 (/blocks.4/self_attn/Constant_49_output_0)/blocks.4/self_attn/Unsqueeze_23_output_0 /blocks.4/self_attn/Unsqueeze_23" Unsqueeze (/blocks.4/self_attn/Constant_50_output_0/blocks.4/self_attn/Constant_50"Constant*G value*;B+/blocks.4/self_attn/Constant_50_attr::valueJ (/blocks.4/self_attn/Constant_51_output_0/blocks.4/self_attn/Constant_51"Constant*G value*;B+/blocks.4/self_attn/Constant_51_attr::valueJ  &/blocks.4/self_attn/Gather_12_output_0 (/blocks.4/self_attn/Constant_51_output_0)/blocks.4/self_attn/Unsqueeze_24_output_0 /blocks.4/self_attn/Unsqueeze_24" Unsqueeze (/blocks.4/self_attn/Constant_52_output_0/blocks.4/self_attn/Constant_52"Constant*G value*;B+/blocks.4/self_attn/Constant_52_attr::valueJ  &/blocks.4/self_attn/Gather_13_output_0 (/blocks.4/self_attn/Constant_52_output_0)/blocks.4/self_attn/Unsqueeze_25_output_0 /blocks.4/self_attn/Unsqueeze_25" Unsqueeze  )/blocks.4/self_attn/Unsqueeze_22_output_0 )/blocks.4/self_attn/Unsqueeze_23_output_0 (/blocks.4/self_attn/Constant_50_output_0 )/blocks.4/self_attn/Unsqueeze_24_output_0 )/blocks.4/self_attn/Unsqueeze_25_output_0&/blocks.4/self_attn/Concat_10_output_0/blocks.4/self_attn/Concat_10"Concat* axis (/blocks.4/self_attn/Constant_53_output_0/blocks.4/self_attn/Constant_53"Constant*G value*;B+/blocks.4/self_attn/Constant_53_attr::valueJ  &/blocks.4/self_attn/Concat_10_output_0 (/blocks.4/self_attn/Constant_53_output_0&/blocks.4/self_attn/Reshape_5_output_0/blocks.4/self_attn/Reshape_5"Reshape* allowzero t &/blocks.4/self_attn/Reshape_5_output_0%/blocks.4/self_attn/Shape_13_output_0/blocks.4/self_attn/Shape_13"Shape  %/blocks.4/self_attn/Shape_13_output_0./blocks.4/self_attn/ConstantOfShape_1_output_0%/blocks.4/self_attn/ConstantOfShape_1"ConstantOfShape*M value*AB1/blocks.4/self_attn/ConstantOfShape_1_attr::valueJ (/blocks.4/self_attn/Constant_54_output_0/blocks.4/self_attn/Constant_54"Constant*E value*9B+/blocks.4/self_attn/Constant_54_attr::valueJ  ./blocks.4/self_attn/ConstantOfShape_1_output_0 (/blocks.4/self_attn/Constant_54_output_0"/blocks.4/self_attn/Mul_6_output_0/blocks.4/self_attn/Mul_6"Mul  &/blocks.4/self_attn/Reshape_5_output_0 "/blocks.4/self_attn/Mul_6_output_0$/blocks.4/self_attn/Equal_1_output_0/blocks.4/self_attn/Equal_1"Equal  $/blocks.4/self_attn/Equal_1_output_0 ./blocks.4/self_attn/ConstantOfShape_1_output_0 &/blocks.4/self_attn/Reshape_5_output_0$/blocks.4/self_attn/Where_1_output_0/blocks.4/self_attn/Where_1"Where  )/blocks.4/self_attn/Unsqueeze_21_output_0 $/blocks.4/self_attn/Where_1_output_0%/blocks.4/self_attn/Expand_1_output_0/blocks.4/self_attn/Expand_1"Expand (/blocks.4/self_attn/Constant_55_output_0/blocks.4/self_attn/Constant_55"Constant*E value*9B+/blocks.4/self_attn/Constant_55_attr::valueJ  &/blocks.4/self_attn/Gather_11_output_0 (/blocks.4/self_attn/Constant_55_output_0"/blocks.4/self_attn/Mul_7_output_0/blocks.4/self_attn/Mul_7"Mul fonnx::Unsqueeze_1744 Constant_3794"Constant*5 value*)BConstant_3794_attr::valueJ  &/blocks.4/self_attn/Gather_10_output_0 onnx::Unsqueeze_1744)/blocks.4/self_attn/Unsqueeze_26_output_0 /blocks.4/self_attn/Unsqueeze_26" Unsqueeze fonnx::Unsqueeze_1746 Constant_3796"Constant*5 value*)BConstant_3796_attr::valueJ  "/blocks.4/self_attn/Mul_7_output_0 onnx::Unsqueeze_1746)/blocks.4/self_attn/Unsqueeze_27_output_0 /blocks.4/self_attn/Unsqueeze_27" Unsqueeze fonnx::Unsqueeze_1748 Constant_3798"Constant*5 value*)BConstant_3798_attr::valueJ  &/blocks.4/self_attn/Gather_12_output_0 onnx::Unsqueeze_1748)/blocks.4/self_attn/Unsqueeze_28_output_0 /blocks.4/self_attn/Unsqueeze_28" Unsqueeze fonnx::Unsqueeze_1750 Constant_3800"Constant*5 value*)BConstant_3800_attr::valueJ  &/blocks.4/self_attn/Gather_13_output_0 onnx::Unsqueeze_1750)/blocks.4/self_attn/Unsqueeze_29_output_0 /blocks.4/self_attn/Unsqueeze_29" Unsqueeze  )/blocks.4/self_attn/Unsqueeze_26_output_0 )/blocks.4/self_attn/Unsqueeze_27_output_0 )/blocks.4/self_attn/Unsqueeze_28_output_0 )/blocks.4/self_attn/Unsqueeze_29_output_0&/blocks.4/self_attn/Concat_11_output_0/blocks.4/self_attn/Concat_11"Concat* axis  %/blocks.4/self_attn/Expand_1_output_0 &/blocks.4/self_attn/Concat_11_output_0&/blocks.4/self_attn/Reshape_6_output_0/blocks.4/self_attn/Reshape_6"Reshape* allowzero  &/blocks.4/self_attn/Transpose_output_0 &/blocks.4/self_attn/Reshape_4_output_0#/blocks.4/self_attn/MatMul_output_0/blocks.4/self_attn/MatMul"MatMul (/blocks.4/self_attn/Constant_56_output_0/blocks.4/self_attn/Constant_56"Constant*A value*5B+/blocks.4/self_attn/Constant_56_attr::valueJ5A  #/blocks.4/self_attn/MatMul_output_0 (/blocks.4/self_attn/Constant_56_output_0"/blocks.4/self_attn/Div_2_output_0/blocks.4/self_attn/Div_2"Div x "/blocks.4/self_attn/Div_2_output_0 attention_mask"/blocks.4/self_attn/Add_2_output_0/blocks.4/self_attn/Add_2"Add  "/blocks.4/self_attn/Add_2_output_0$/blocks.4/self_attn/Softmax_output_0/blocks.4/self_attn/Softmax"Softmax* axis x $/blocks.4/self_attn/Softmax_output_0#/blocks.4/self_attn/Cast_4_output_0/blocks.4/self_attn/Cast_4"Cast* to  #/blocks.4/self_attn/Cast_4_output_0 &/blocks.4/self_attn/Reshape_6_output_0%/blocks.4/self_attn/MatMul_1_output_0/blocks.4/self_attn/MatMul_1"MatMul  %/blocks.4/self_attn/MatMul_1_output_0(/blocks.4/self_attn/Transpose_3_output_0/blocks.4/self_attn/Transpose_3" Transpose* perm@@@@ fonnx::Unsqueeze_1762 Constant_3812"Constant*5 value*)BConstant_3812_attr::valueJ  #/blocks.4/self_attn/Gather_output_0 onnx::Unsqueeze_1762)/blocks.4/self_attn/Unsqueeze_30_output_0 /blocks.4/self_attn/Unsqueeze_30" Unsqueeze fonnx::Unsqueeze_1764 Constant_3814"Constant*5 value*)BConstant_3814_attr::valueJ  %/blocks.4/self_attn/Gather_1_output_0 onnx::Unsqueeze_1764)/blocks.4/self_attn/Unsqueeze_31_output_0 /blocks.4/self_attn/Unsqueeze_31" Unsqueeze (/blocks.4/self_attn/Constant_57_output_0/blocks.4/self_attn/Constant_57"Constant*G value*;B+/blocks.4/self_attn/Constant_57_attr::valueJ  )/blocks.4/self_attn/Unsqueeze_30_output_0 )/blocks.4/self_attn/Unsqueeze_31_output_0 (/blocks.4/self_attn/Constant_57_output_0&/blocks.4/self_attn/Concat_12_output_0/blocks.4/self_attn/Concat_12"Concat* axis  (/blocks.4/self_attn/Transpose_3_output_0 &/blocks.4/self_attn/Concat_12_output_0&/blocks.4/self_attn/Reshape_7_output_0/blocks.4/self_attn/Reshape_7"Reshape* allowzero  &/blocks.4/self_attn/Reshape_7_output_0 onnx::MatMul_8701*/blocks.4/self_attn/o_proj/MatMul_output_0!/blocks.4/self_attn/o_proj/MatMul"MatMul  )/blocks.4/input_layernorm/Cast_1_output_0 */blocks.4/self_attn/o_proj/MatMul_output_0/blocks.4/Add_output_0 /blocks.4/Add"Add  /blocks.4/Add_output_00/blocks.4/post_attention_layernorm/Cast_output_0'/blocks.4/post_attention_layernorm/Cast"Cast* to 4/blocks.4/post_attention_layernorm/Constant_output_0+/blocks.4/post_attention_layernorm/Constant"Constant*M value*AB7/blocks.4/post_attention_layernorm/Constant_attr::valueJ@  0/blocks.4/post_attention_layernorm/Cast_output_0 4/blocks.4/post_attention_layernorm/Constant_output_0//blocks.4/post_attention_layernorm/Pow_output_0&/blocks.4/post_attention_layernorm/Pow"Pow  //blocks.4/post_attention_layernorm/Pow_output_06/blocks.4/post_attention_layernorm/ReduceMean_output_0-/blocks.4/post_attention_layernorm/ReduceMean" ReduceMean* axes@* keepdims 6/blocks.4/post_attention_layernorm/Constant_1_output_0-/blocks.4/post_attention_layernorm/Constant_1"Constant*O value*CB9/blocks.4/post_attention_layernorm/Constant_1_attr::valueJ75  6/blocks.4/post_attention_layernorm/ReduceMean_output_0 6/blocks.4/post_attention_layernorm/Constant_1_output_0//blocks.4/post_attention_layernorm/Add_output_0&/blocks.4/post_attention_layernorm/Add"Add  //blocks.4/post_attention_layernorm/Add_output_00/blocks.4/post_attention_layernorm/Sqrt_output_0'/blocks.4/post_attention_layernorm/Sqrt"Sqrt 6/blocks.4/post_attention_layernorm/Constant_2_output_0-/blocks.4/post_attention_layernorm/Constant_2"Constant*O value*CB9/blocks.4/post_attention_layernorm/Constant_2_attr::valueJ?  6/blocks.4/post_attention_layernorm/Constant_2_output_0 0/blocks.4/post_attention_layernorm/Sqrt_output_0//blocks.4/post_attention_layernorm/Div_output_0&/blocks.4/post_attention_layernorm/Div"Div  0/blocks.4/post_attention_layernorm/Cast_output_02/blocks.4/post_attention_layernorm/Cast_1_output_0)/blocks.4/post_attention_layernorm/Cast_1"Cast* to  2/blocks.4/post_attention_layernorm/Cast_1_output_0 //blocks.4/post_attention_layernorm/Div_output_0//blocks.4/post_attention_layernorm/Mul_output_0&/blocks.4/post_attention_layernorm/Mul"Mul  //blocks.4/post_attention_layernorm/Mul_output_0 (blocks.4.post_attention_layernorm.weight1/blocks.4/post_attention_layernorm/Mul_1_output_0(/blocks.4/post_attention_layernorm/Mul_1"Mul  1/blocks.4/post_attention_layernorm/Mul_1_output_02/blocks.4/post_attention_layernorm/Cast_2_output_0)/blocks.4/post_attention_layernorm/Cast_2"Cast* to  2/blocks.4/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_8702'/blocks.4/mlp/gate_proj/MatMul_output_0/blocks.4/mlp/gate_proj/MatMul"MatMul w '/blocks.4/mlp/gate_proj/MatMul_output_0%/blocks.4/mlp/act_fn/Sigmoid_output_0/blocks.4/mlp/act_fn/Sigmoid"Sigmoid  '/blocks.4/mlp/gate_proj/MatMul_output_0 %/blocks.4/mlp/act_fn/Sigmoid_output_0!/blocks.4/mlp/act_fn/Mul_output_0/blocks.4/mlp/act_fn/Mul"Mul  2/blocks.4/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_8703%/blocks.4/mlp/up_proj/MatMul_output_0/blocks.4/mlp/up_proj/MatMul"MatMul ~ !/blocks.4/mlp/act_fn/Mul_output_0 %/blocks.4/mlp/up_proj/MatMul_output_0/blocks.4/mlp/Mul_output_0/blocks.4/mlp/Mul"Mul  /blocks.4/mlp/Mul_output_0 onnx::MatMul_8704'/blocks.4/mlp/down_proj/MatMul_output_0/blocks.4/mlp/down_proj/MatMul"MatMul  2/blocks.4/post_attention_layernorm/Cast_1_output_0 '/blocks.4/mlp/down_proj/MatMul_output_0/blocks.4/Add_1_output_0/blocks.4/Add_1"Add Z/Constant_output_0 /Constant"Constant*/ value*#B/Constant_attr::valueJ Y past_key_values /Constant_output_0/Gather_5_output_0 /Gather_5"Gather* axis /blocks.5/Constant_output_0/blocks.5/Constant"Constant*J value*>B/blocks.5/Constant_attr::valueJ  /blocks.4/Add_1_output_0 /blocks.5/Constant_output_0/blocks.5/Reshape_output_0/blocks.5/Reshape"Reshape* allowzero v /blocks.5/Reshape_output_0'/blocks.5/input_layernorm/Cast_output_0/blocks.5/input_layernorm/Cast"Cast* to +/blocks.5/input_layernorm/Constant_output_0"/blocks.5/input_layernorm/Constant"Constant*D value*8B./blocks.5/input_layernorm/Constant_attr::valueJ@  '/blocks.5/input_layernorm/Cast_output_0 +/blocks.5/input_layernorm/Constant_output_0&/blocks.5/input_layernorm/Pow_output_0/blocks.5/input_layernorm/Pow"Pow  &/blocks.5/input_layernorm/Pow_output_0-/blocks.5/input_layernorm/ReduceMean_output_0$/blocks.5/input_layernorm/ReduceMean" ReduceMean* axes@* keepdims -/blocks.5/input_layernorm/Constant_1_output_0$/blocks.5/input_layernorm/Constant_1"Constant*F value*:B0/blocks.5/input_layernorm/Constant_1_attr::valueJ75  -/blocks.5/input_layernorm/ReduceMean_output_0 -/blocks.5/input_layernorm/Constant_1_output_0&/blocks.5/input_layernorm/Add_output_0/blocks.5/input_layernorm/Add"Add w &/blocks.5/input_layernorm/Add_output_0'/blocks.5/input_layernorm/Sqrt_output_0/blocks.5/input_layernorm/Sqrt"Sqrt -/blocks.5/input_layernorm/Constant_2_output_0$/blocks.5/input_layernorm/Constant_2"Constant*F value*:B0/blocks.5/input_layernorm/Constant_2_attr::valueJ?  -/blocks.5/input_layernorm/Constant_2_output_0 '/blocks.5/input_layernorm/Sqrt_output_0&/blocks.5/input_layernorm/Div_output_0/blocks.5/input_layernorm/Div"Div  '/blocks.5/input_layernorm/Cast_output_0)/blocks.5/input_layernorm/Cast_1_output_0 /blocks.5/input_layernorm/Cast_1"Cast* to  )/blocks.5/input_layernorm/Cast_1_output_0 &/blocks.5/input_layernorm/Div_output_0&/blocks.5/input_layernorm/Mul_output_0/blocks.5/input_layernorm/Mul"Mul  &/blocks.5/input_layernorm/Mul_output_0 blocks.5.input_layernorm.weight(/blocks.5/input_layernorm/Mul_1_output_0/blocks.5/input_layernorm/Mul_1"Mul  (/blocks.5/input_layernorm/Mul_1_output_0)/blocks.5/input_layernorm/Cast_2_output_0 /blocks.5/input_layernorm/Cast_2"Cast* to q )/blocks.5/input_layernorm/Cast_2_output_0"/blocks.5/self_attn/Shape_output_0/blocks.5/self_attn/Shape"Shape %/blocks.5/self_attn/Constant_output_0/blocks.5/self_attn/Constant"Constant*B value*6B(/blocks.5/self_attn/Constant_attr::valueJ  "/blocks.5/self_attn/Shape_output_0 %/blocks.5/self_attn/Constant_output_0#/blocks.5/self_attn/Gather_output_0/blocks.5/self_attn/Gather"Gather* axis u )/blocks.5/input_layernorm/Cast_2_output_0$/blocks.5/self_attn/Shape_1_output_0/blocks.5/self_attn/Shape_1"Shape '/blocks.5/self_attn/Constant_1_output_0/blocks.5/self_attn/Constant_1"Constant*D value*8B*/blocks.5/self_attn/Constant_1_attr::valueJ  $/blocks.5/self_attn/Shape_1_output_0 '/blocks.5/self_attn/Constant_1_output_0%/blocks.5/self_attn/Gather_1_output_0/blocks.5/self_attn/Gather_1"Gather* axis  )/blocks.5/input_layernorm/Cast_2_output_0 onnx::MatMul_8705*/blocks.5/self_attn/q_proj/MatMul_output_0!/blocks.5/self_attn/q_proj/MatMul"MatMul  )/blocks.5/input_layernorm/Cast_2_output_0 onnx::MatMul_8706*/blocks.5/self_attn/k_proj/MatMul_output_0!/blocks.5/self_attn/k_proj/MatMul"MatMul  )/blocks.5/input_layernorm/Cast_2_output_0 onnx::MatMul_8707*/blocks.5/self_attn/v_proj/MatMul_output_0!/blocks.5/self_attn/v_proj/MatMul"MatMul fonnx::Unsqueeze_1825 Constant_3867"Constant*5 value*)BConstant_3867_attr::valueJ  #/blocks.5/self_attn/Gather_output_0 onnx::Unsqueeze_1825&/blocks.5/self_attn/Unsqueeze_output_0/blocks.5/self_attn/Unsqueeze" Unsqueeze fonnx::Unsqueeze_1827 Constant_3869"Constant*5 value*)BConstant_3869_attr::valueJ  %/blocks.5/self_attn/Gather_1_output_0 onnx::Unsqueeze_1827(/blocks.5/self_attn/Unsqueeze_1_output_0/blocks.5/self_attn/Unsqueeze_1" Unsqueeze '/blocks.5/self_attn/Constant_2_output_0/blocks.5/self_attn/Constant_2"Constant*F value*:B*/blocks.5/self_attn/Constant_2_attr::valueJ '/blocks.5/self_attn/Constant_3_output_0/blocks.5/self_attn/Constant_3"Constant*F value*:B*/blocks.5/self_attn/Constant_3_attr::valueJ  &/blocks.5/self_attn/Unsqueeze_output_0 (/blocks.5/self_attn/Unsqueeze_1_output_0 '/blocks.5/self_attn/Constant_2_output_0 '/blocks.5/self_attn/Constant_3_output_0#/blocks.5/self_attn/Concat_output_0/blocks.5/self_attn/Concat"Concat* axis  */blocks.5/self_attn/q_proj/MatMul_output_0 #/blocks.5/self_attn/Concat_output_0$/blocks.5/self_attn/Reshape_output_0/blocks.5/self_attn/Reshape"Reshape* allowzero fonnx::Unsqueeze_1835 Constant_3875"Constant*5 value*)BConstant_3875_attr::valueJ  #/blocks.5/self_attn/Gather_output_0 onnx::Unsqueeze_1835(/blocks.5/self_attn/Unsqueeze_2_output_0/blocks.5/self_attn/Unsqueeze_2" Unsqueeze fonnx::Unsqueeze_1837 Constant_3877"Constant*5 value*)BConstant_3877_attr::valueJ  %/blocks.5/self_attn/Gather_1_output_0 onnx::Unsqueeze_1837(/blocks.5/self_attn/Unsqueeze_3_output_0/blocks.5/self_attn/Unsqueeze_3" Unsqueeze '/blocks.5/self_attn/Constant_4_output_0/blocks.5/self_attn/Constant_4"Constant*F value*:B*/blocks.5/self_attn/Constant_4_attr::valueJ '/blocks.5/self_attn/Constant_5_output_0/blocks.5/self_attn/Constant_5"Constant*F value*:B*/blocks.5/self_attn/Constant_5_attr::valueJ  (/blocks.5/self_attn/Unsqueeze_2_output_0 (/blocks.5/self_attn/Unsqueeze_3_output_0 '/blocks.5/self_attn/Constant_4_output_0 '/blocks.5/self_attn/Constant_5_output_0%/blocks.5/self_attn/Concat_1_output_0/blocks.5/self_attn/Concat_1"Concat* axis fonnx::Unsqueeze_1844 Constant_3882"Constant*5 value*)BConstant_3882_attr::valueJ  #/blocks.5/self_attn/Gather_output_0 onnx::Unsqueeze_1844(/blocks.5/self_attn/Unsqueeze_4_output_0/blocks.5/self_attn/Unsqueeze_4" Unsqueeze fonnx::Unsqueeze_1846 Constant_3884"Constant*5 value*)BConstant_3884_attr::valueJ  %/blocks.5/self_attn/Gather_1_output_0 onnx::Unsqueeze_1846(/blocks.5/self_attn/Unsqueeze_5_output_0/blocks.5/self_attn/Unsqueeze_5" Unsqueeze '/blocks.5/self_attn/Constant_6_output_0/blocks.5/self_attn/Constant_6"Constant*F value*:B*/blocks.5/self_attn/Constant_6_attr::valueJ '/blocks.5/self_attn/Constant_7_output_0/blocks.5/self_attn/Constant_7"Constant*F value*:B*/blocks.5/self_attn/Constant_7_attr::valueJ  (/blocks.5/self_attn/Unsqueeze_4_output_0 (/blocks.5/self_attn/Unsqueeze_5_output_0 '/blocks.5/self_attn/Constant_6_output_0 '/blocks.5/self_attn/Constant_7_output_0%/blocks.5/self_attn/Concat_2_output_0/blocks.5/self_attn/Concat_2"Concat* axis  */blocks.5/self_attn/k_proj/MatMul_output_0 %/blocks.5/self_attn/Concat_1_output_0&/blocks.5/self_attn/Reshape_1_output_0/blocks.5/self_attn/Reshape_1"Reshape* allowzero  */blocks.5/self_attn/v_proj/MatMul_output_0 %/blocks.5/self_attn/Concat_2_output_0&/blocks.5/self_attn/Reshape_2_output_0/blocks.5/self_attn/Reshape_2"Reshape* allowzero  $/blocks.5/self_attn/Reshape_output_0(/blocks.5/self_attn/q_norm/Cast_output_0/blocks.5/self_attn/q_norm/Cast"Cast* to ,/blocks.5/self_attn/q_norm/Constant_output_0#/blocks.5/self_attn/q_norm/Constant"Constant*E value*9B//blocks.5/self_attn/q_norm/Constant_attr::valueJ@  (/blocks.5/self_attn/q_norm/Cast_output_0 ,/blocks.5/self_attn/q_norm/Constant_output_0'/blocks.5/self_attn/q_norm/Pow_output_0/blocks.5/self_attn/q_norm/Pow"Pow  '/blocks.5/self_attn/q_norm/Pow_output_0./blocks.5/self_attn/q_norm/ReduceMean_output_0%/blocks.5/self_attn/q_norm/ReduceMean" ReduceMean* axes@* keepdims ./blocks.5/self_attn/q_norm/Constant_1_output_0%/blocks.5/self_attn/q_norm/Constant_1"Constant*G value*;B1/blocks.5/self_attn/q_norm/Constant_1_attr::valueJ75  ./blocks.5/self_attn/q_norm/ReduceMean_output_0 ./blocks.5/self_attn/q_norm/Constant_1_output_0'/blocks.5/self_attn/q_norm/Add_output_0/blocks.5/self_attn/q_norm/Add"Add z '/blocks.5/self_attn/q_norm/Add_output_0(/blocks.5/self_attn/q_norm/Sqrt_output_0/blocks.5/self_attn/q_norm/Sqrt"Sqrt ./blocks.5/self_attn/q_norm/Constant_2_output_0%/blocks.5/self_attn/q_norm/Constant_2"Constant*G value*;B1/blocks.5/self_attn/q_norm/Constant_2_attr::valueJ?  ./blocks.5/self_attn/q_norm/Constant_2_output_0 (/blocks.5/self_attn/q_norm/Sqrt_output_0'/blocks.5/self_attn/q_norm/Div_output_0/blocks.5/self_attn/q_norm/Div"Div  (/blocks.5/self_attn/q_norm/Cast_output_0*/blocks.5/self_attn/q_norm/Cast_1_output_0!/blocks.5/self_attn/q_norm/Cast_1"Cast* to  */blocks.5/self_attn/q_norm/Cast_1_output_0 '/blocks.5/self_attn/q_norm/Div_output_0'/blocks.5/self_attn/q_norm/Mul_output_0/blocks.5/self_attn/q_norm/Mul"Mul  '/blocks.5/self_attn/q_norm/Mul_output_0 blocks.5.self_attn.q_norm.weight)/blocks.5/self_attn/q_norm/Mul_1_output_0 /blocks.5/self_attn/q_norm/Mul_1"Mul  )/blocks.5/self_attn/q_norm/Mul_1_output_0*/blocks.5/self_attn/q_norm/Cast_2_output_0!/blocks.5/self_attn/q_norm/Cast_2"Cast* to  &/blocks.5/self_attn/Reshape_1_output_0(/blocks.5/self_attn/k_norm/Cast_output_0/blocks.5/self_attn/k_norm/Cast"Cast* to ,/blocks.5/self_attn/k_norm/Constant_output_0#/blocks.5/self_attn/k_norm/Constant"Constant*E value*9B//blocks.5/self_attn/k_norm/Constant_attr::valueJ@  (/blocks.5/self_attn/k_norm/Cast_output_0 ,/blocks.5/self_attn/k_norm/Constant_output_0'/blocks.5/self_attn/k_norm/Pow_output_0/blocks.5/self_attn/k_norm/Pow"Pow  '/blocks.5/self_attn/k_norm/Pow_output_0./blocks.5/self_attn/k_norm/ReduceMean_output_0%/blocks.5/self_attn/k_norm/ReduceMean" ReduceMean* axes@* keepdims ./blocks.5/self_attn/k_norm/Constant_1_output_0%/blocks.5/self_attn/k_norm/Constant_1"Constant*G value*;B1/blocks.5/self_attn/k_norm/Constant_1_attr::valueJ75  ./blocks.5/self_attn/k_norm/ReduceMean_output_0 ./blocks.5/self_attn/k_norm/Constant_1_output_0'/blocks.5/self_attn/k_norm/Add_output_0/blocks.5/self_attn/k_norm/Add"Add z '/blocks.5/self_attn/k_norm/Add_output_0(/blocks.5/self_attn/k_norm/Sqrt_output_0/blocks.5/self_attn/k_norm/Sqrt"Sqrt ./blocks.5/self_attn/k_norm/Constant_2_output_0%/blocks.5/self_attn/k_norm/Constant_2"Constant*G value*;B1/blocks.5/self_attn/k_norm/Constant_2_attr::valueJ?  ./blocks.5/self_attn/k_norm/Constant_2_output_0 (/blocks.5/self_attn/k_norm/Sqrt_output_0'/blocks.5/self_attn/k_norm/Div_output_0/blocks.5/self_attn/k_norm/Div"Div  (/blocks.5/self_attn/k_norm/Cast_output_0*/blocks.5/self_attn/k_norm/Cast_1_output_0!/blocks.5/self_attn/k_norm/Cast_1"Cast* to  */blocks.5/self_attn/k_norm/Cast_1_output_0 '/blocks.5/self_attn/k_norm/Div_output_0'/blocks.5/self_attn/k_norm/Mul_output_0/blocks.5/self_attn/k_norm/Mul"Mul  '/blocks.5/self_attn/k_norm/Mul_output_0 blocks.5.self_attn.k_norm.weight)/blocks.5/self_attn/k_norm/Mul_1_output_0 /blocks.5/self_attn/k_norm/Mul_1"Mul  )/blocks.5/self_attn/k_norm/Mul_1_output_0*/blocks.5/self_attn/k_norm/Cast_2_output_0!/blocks.5/self_attn/k_norm/Cast_2"Cast* to  */blocks.5/self_attn/q_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0 /blocks.5/self_attn/Mul_output_0/blocks.5/self_attn/Mul"Mul v */blocks.5/self_attn/q_norm/Cast_2_output_0$/blocks.5/self_attn/Shape_2_output_0/blocks.5/self_attn/Shape_2"Shape '/blocks.5/self_attn/Constant_8_output_0/blocks.5/self_attn/Constant_8"Constant*D value*8B*/blocks.5/self_attn/Constant_8_attr::valueJ  $/blocks.5/self_attn/Shape_2_output_0 '/blocks.5/self_attn/Constant_8_output_0%/blocks.5/self_attn/Gather_2_output_0/blocks.5/self_attn/Gather_2"Gather* axis '/blocks.5/self_attn/Constant_9_output_0/blocks.5/self_attn/Constant_9"Constant*D value*8B*/blocks.5/self_attn/Constant_9_attr::valueJ  %/blocks.5/self_attn/Gather_2_output_0 '/blocks.5/self_attn/Constant_9_output_0 /blocks.5/self_attn/Div_output_0/blocks.5/self_attn/Div"Div p /blocks.5/self_attn/Div_output_0!/blocks.5/self_attn/Cast_output_0/blocks.5/self_attn/Cast"Cast* to u !/blocks.5/self_attn/Cast_output_0#/blocks.5/self_attn/Cast_1_output_0/blocks.5/self_attn/Cast_1"Cast* to (/blocks.5/self_attn/Constant_10_output_0/blocks.5/self_attn/Constant_10"Constant*G value*;B+/blocks.5/self_attn/Constant_10_attr::valueJ (/blocks.5/self_attn/Constant_11_output_0/blocks.5/self_attn/Constant_11"Constant*G value*;B+/blocks.5/self_attn/Constant_11_attr::valueJ (/blocks.5/self_attn/Constant_12_output_0/blocks.5/self_attn/Constant_12"Constant*G value*;B+/blocks.5/self_attn/Constant_12_attr::valueJ  #/blocks.5/self_attn/Cast_1_output_0 (/blocks.5/self_attn/Constant_12_output_0(/blocks.5/self_attn/Unsqueeze_6_output_0/blocks.5/self_attn/Unsqueeze_6" Unsqueeze (/blocks.5/self_attn/Constant_13_output_0/blocks.5/self_attn/Constant_13"Constant*G value*;B+/blocks.5/self_attn/Constant_13_attr::valueJ  */blocks.5/self_attn/q_norm/Cast_2_output_0 (/blocks.5/self_attn/Constant_11_output_0 (/blocks.5/self_attn/Unsqueeze_6_output_0 (/blocks.5/self_attn/Constant_10_output_0 (/blocks.5/self_attn/Constant_13_output_0"/blocks.5/self_attn/Slice_output_0/blocks.5/self_attn/Slice"Slice (/blocks.5/self_attn/Constant_14_output_0/blocks.5/self_attn/Constant_14"Constant*G value*;B+/blocks.5/self_attn/Constant_14_attr::valueJ (/blocks.5/self_attn/Constant_15_output_0/blocks.5/self_attn/Constant_15"Constant*G value*;B+/blocks.5/self_attn/Constant_15_attr::valueJ  #/blocks.5/self_attn/Cast_1_output_0 (/blocks.5/self_attn/Constant_15_output_0(/blocks.5/self_attn/Unsqueeze_7_output_0/blocks.5/self_attn/Unsqueeze_7" Unsqueeze (/blocks.5/self_attn/Constant_16_output_0/blocks.5/self_attn/Constant_16"Constant*G value*;B+/blocks.5/self_attn/Constant_16_attr::valueJ (/blocks.5/self_attn/Constant_17_output_0/blocks.5/self_attn/Constant_17"Constant*G value*;B+/blocks.5/self_attn/Constant_17_attr::valueJ  */blocks.5/self_attn/q_norm/Cast_2_output_0 (/blocks.5/self_attn/Unsqueeze_7_output_0 (/blocks.5/self_attn/Constant_16_output_0 (/blocks.5/self_attn/Constant_14_output_0 (/blocks.5/self_attn/Constant_17_output_0$/blocks.5/self_attn/Slice_1_output_0/blocks.5/self_attn/Slice_1"Slice f $/blocks.5/self_attn/Slice_1_output_0 /blocks.5/self_attn/Neg_output_0/blocks.5/self_attn/Neg"Neg  /blocks.5/self_attn/Neg_output_0 "/blocks.5/self_attn/Slice_output_0%/blocks.5/self_attn/Concat_3_output_0/blocks.5/self_attn/Concat_3"Concat* axis  %/blocks.5/self_attn/Concat_3_output_0 %/blocks.0/self_attn/Gather_3_output_0"/blocks.5/self_attn/Mul_1_output_0/blocks.5/self_attn/Mul_1"Mul  /blocks.5/self_attn/Mul_output_0 "/blocks.5/self_attn/Mul_1_output_0 /blocks.5/self_attn/Add_output_0/blocks.5/self_attn/Add"Add  */blocks.5/self_attn/k_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0"/blocks.5/self_attn/Mul_2_output_0/blocks.5/self_attn/Mul_2"Mul v */blocks.5/self_attn/k_norm/Cast_2_output_0$/blocks.5/self_attn/Shape_3_output_0/blocks.5/self_attn/Shape_3"Shape (/blocks.5/self_attn/Constant_18_output_0/blocks.5/self_attn/Constant_18"Constant*E value*9B+/blocks.5/self_attn/Constant_18_attr::valueJ  $/blocks.5/self_attn/Shape_3_output_0 (/blocks.5/self_attn/Constant_18_output_0%/blocks.5/self_attn/Gather_3_output_0/blocks.5/self_attn/Gather_3"Gather* axis (/blocks.5/self_attn/Constant_19_output_0/blocks.5/self_attn/Constant_19"Constant*E value*9B+/blocks.5/self_attn/Constant_19_attr::valueJ  %/blocks.5/self_attn/Gather_3_output_0 (/blocks.5/self_attn/Constant_19_output_0"/blocks.5/self_attn/Div_1_output_0/blocks.5/self_attn/Div_1"Div v "/blocks.5/self_attn/Div_1_output_0#/blocks.5/self_attn/Cast_2_output_0/blocks.5/self_attn/Cast_2"Cast* to w #/blocks.5/self_attn/Cast_2_output_0#/blocks.5/self_attn/Cast_3_output_0/blocks.5/self_attn/Cast_3"Cast* to (/blocks.5/self_attn/Constant_20_output_0/blocks.5/self_attn/Constant_20"Constant*G value*;B+/blocks.5/self_attn/Constant_20_attr::valueJ (/blocks.5/self_attn/Constant_21_output_0/blocks.5/self_attn/Constant_21"Constant*G value*;B+/blocks.5/self_attn/Constant_21_attr::valueJ (/blocks.5/self_attn/Constant_22_output_0/blocks.5/self_attn/Constant_22"Constant*G value*;B+/blocks.5/self_attn/Constant_22_attr::valueJ  #/blocks.5/self_attn/Cast_3_output_0 (/blocks.5/self_attn/Constant_22_output_0(/blocks.5/self_attn/Unsqueeze_8_output_0/blocks.5/self_attn/Unsqueeze_8" Unsqueeze (/blocks.5/self_attn/Constant_23_output_0/blocks.5/self_attn/Constant_23"Constant*G value*;B+/blocks.5/self_attn/Constant_23_attr::valueJ  */blocks.5/self_attn/k_norm/Cast_2_output_0 (/blocks.5/self_attn/Constant_21_output_0 (/blocks.5/self_attn/Unsqueeze_8_output_0 (/blocks.5/self_attn/Constant_20_output_0 (/blocks.5/self_attn/Constant_23_output_0$/blocks.5/self_attn/Slice_2_output_0/blocks.5/self_attn/Slice_2"Slice (/blocks.5/self_attn/Constant_24_output_0/blocks.5/self_attn/Constant_24"Constant*G value*;B+/blocks.5/self_attn/Constant_24_attr::valueJ (/blocks.5/self_attn/Constant_25_output_0/blocks.5/self_attn/Constant_25"Constant*G value*;B+/blocks.5/self_attn/Constant_25_attr::valueJ  #/blocks.5/self_attn/Cast_3_output_0 (/blocks.5/self_attn/Constant_25_output_0(/blocks.5/self_attn/Unsqueeze_9_output_0/blocks.5/self_attn/Unsqueeze_9" Unsqueeze (/blocks.5/self_attn/Constant_26_output_0/blocks.5/self_attn/Constant_26"Constant*G value*;B+/blocks.5/self_attn/Constant_26_attr::valueJ (/blocks.5/self_attn/Constant_27_output_0/blocks.5/self_attn/Constant_27"Constant*G value*;B+/blocks.5/self_attn/Constant_27_attr::valueJ  */blocks.5/self_attn/k_norm/Cast_2_output_0 (/blocks.5/self_attn/Unsqueeze_9_output_0 (/blocks.5/self_attn/Constant_26_output_0 (/blocks.5/self_attn/Constant_24_output_0 (/blocks.5/self_attn/Constant_27_output_0$/blocks.5/self_attn/Slice_3_output_0/blocks.5/self_attn/Slice_3"Slice j $/blocks.5/self_attn/Slice_3_output_0"/blocks.5/self_attn/Neg_1_output_0/blocks.5/self_attn/Neg_1"Neg  "/blocks.5/self_attn/Neg_1_output_0 $/blocks.5/self_attn/Slice_2_output_0%/blocks.5/self_attn/Concat_4_output_0/blocks.5/self_attn/Concat_4"Concat* axis  %/blocks.5/self_attn/Concat_4_output_0 %/blocks.0/self_attn/Gather_3_output_0"/blocks.5/self_attn/Mul_3_output_0/blocks.5/self_attn/Mul_3"Mul  "/blocks.5/self_attn/Mul_2_output_0 "/blocks.5/self_attn/Mul_3_output_0"/blocks.5/self_attn/Add_1_output_0/blocks.5/self_attn/Add_1"Add  /Gather_5_output_0 /rotary/Constant_3_output_0%/blocks.5/self_attn/Gather_4_output_0/blocks.5/self_attn/Gather_4"Gather* axis  /Gather_5_output_0 /rotary/Constant_8_output_0%/blocks.5/self_attn/Gather_5_output_0/blocks.5/self_attn/Gather_5"Gather* axis  %/blocks.5/self_attn/Gather_4_output_0 "/blocks.5/self_attn/Add_1_output_0%/blocks.5/self_attn/Concat_5_output_0/blocks.5/self_attn/Concat_5"Concat* axis  %/blocks.5/self_attn/Gather_5_output_0 &/blocks.5/self_attn/Reshape_2_output_0%/blocks.5/self_attn/Concat_6_output_0/blocks.5/self_attn/Concat_6"Concat* axis (/blocks.5/self_attn/Constant_28_output_0/blocks.5/self_attn/Constant_28"Constant*G value*;B+/blocks.5/self_attn/Constant_28_attr::valueJ  %/blocks.5/self_attn/Concat_5_output_0 (/blocks.5/self_attn/Constant_28_output_0)/blocks.5/self_attn/Unsqueeze_10_output_0 /blocks.5/self_attn/Unsqueeze_10" Unsqueeze (/blocks.5/self_attn/Constant_29_output_0/blocks.5/self_attn/Constant_29"Constant*G value*;B+/blocks.5/self_attn/Constant_29_attr::valueJ  %/blocks.5/self_attn/Concat_6_output_0 (/blocks.5/self_attn/Constant_29_output_0)/blocks.5/self_attn/Unsqueeze_11_output_0 /blocks.5/self_attn/Unsqueeze_11" Unsqueeze  )/blocks.5/self_attn/Unsqueeze_10_output_0 )/blocks.5/self_attn/Unsqueeze_11_output_0%/blocks.5/self_attn/Concat_7_output_0/blocks.5/self_attn/Concat_7"Concat* axis  /blocks.5/self_attn/Add_output_0&/blocks.5/self_attn/Transpose_output_0/blocks.5/self_attn/Transpose" Transpose* perm@@@@  %/blocks.5/self_attn/Concat_5_output_0(/blocks.5/self_attn/Transpose_1_output_0/blocks.5/self_attn/Transpose_1" Transpose* perm@@@@  %/blocks.5/self_attn/Concat_6_output_0(/blocks.5/self_attn/Transpose_2_output_0/blocks.5/self_attn/Transpose_2" Transpose* perm@@@@ t (/blocks.5/self_attn/Transpose_1_output_0$/blocks.5/self_attn/Shape_4_output_0/blocks.5/self_attn/Shape_4"Shape (/blocks.5/self_attn/Constant_30_output_0/blocks.5/self_attn/Constant_30"Constant*E value*9B+/blocks.5/self_attn/Constant_30_attr::valueJ  $/blocks.5/self_attn/Shape_4_output_0 (/blocks.5/self_attn/Constant_30_output_0%/blocks.5/self_attn/Gather_6_output_0/blocks.5/self_attn/Gather_6"Gather* axis t (/blocks.5/self_attn/Transpose_1_output_0$/blocks.5/self_attn/Shape_5_output_0/blocks.5/self_attn/Shape_5"Shape (/blocks.5/self_attn/Constant_31_output_0/blocks.5/self_attn/Constant_31"Constant*E value*9B+/blocks.5/self_attn/Constant_31_attr::valueJ  $/blocks.5/self_attn/Shape_5_output_0 (/blocks.5/self_attn/Constant_31_output_0%/blocks.5/self_attn/Gather_7_output_0/blocks.5/self_attn/Gather_7"Gather* axis t (/blocks.5/self_attn/Transpose_1_output_0$/blocks.5/self_attn/Shape_6_output_0/blocks.5/self_attn/Shape_6"Shape (/blocks.5/self_attn/Constant_32_output_0/blocks.5/self_attn/Constant_32"Constant*E value*9B+/blocks.5/self_attn/Constant_32_attr::valueJ  $/blocks.5/self_attn/Shape_6_output_0 (/blocks.5/self_attn/Constant_32_output_0%/blocks.5/self_attn/Gather_8_output_0/blocks.5/self_attn/Gather_8"Gather* axis t (/blocks.5/self_attn/Transpose_1_output_0$/blocks.5/self_attn/Shape_7_output_0/blocks.5/self_attn/Shape_7"Shape (/blocks.5/self_attn/Constant_33_output_0/blocks.5/self_attn/Constant_33"Constant*E value*9B+/blocks.5/self_attn/Constant_33_attr::valueJ  $/blocks.5/self_attn/Shape_7_output_0 (/blocks.5/self_attn/Constant_33_output_0%/blocks.5/self_attn/Gather_9_output_0/blocks.5/self_attn/Gather_9"Gather* axis (/blocks.5/self_attn/Constant_34_output_0/blocks.5/self_attn/Constant_34"Constant*G value*;B+/blocks.5/self_attn/Constant_34_attr::valueJ  (/blocks.5/self_attn/Transpose_1_output_0 (/blocks.5/self_attn/Constant_34_output_0)/blocks.5/self_attn/Unsqueeze_12_output_0 /blocks.5/self_attn/Unsqueeze_12" Unsqueeze (/blocks.5/self_attn/Constant_35_output_0/blocks.5/self_attn/Constant_35"Constant*G value*;B+/blocks.5/self_attn/Constant_35_attr::valueJ  %/blocks.5/self_attn/Gather_6_output_0 (/blocks.5/self_attn/Constant_35_output_0)/blocks.5/self_attn/Unsqueeze_13_output_0 /blocks.5/self_attn/Unsqueeze_13" Unsqueeze (/blocks.5/self_attn/Constant_36_output_0/blocks.5/self_attn/Constant_36"Constant*G value*;B+/blocks.5/self_attn/Constant_36_attr::valueJ  %/blocks.5/self_attn/Gather_7_output_0 (/blocks.5/self_attn/Constant_36_output_0)/blocks.5/self_attn/Unsqueeze_14_output_0 /blocks.5/self_attn/Unsqueeze_14" Unsqueeze (/blocks.5/self_attn/Constant_37_output_0/blocks.5/self_attn/Constant_37"Constant*G value*;B+/blocks.5/self_attn/Constant_37_attr::valueJ (/blocks.5/self_attn/Constant_38_output_0/blocks.5/self_attn/Constant_38"Constant*G value*;B+/blocks.5/self_attn/Constant_38_attr::valueJ  %/blocks.5/self_attn/Gather_8_output_0 (/blocks.5/self_attn/Constant_38_output_0)/blocks.5/self_attn/Unsqueeze_15_output_0 /blocks.5/self_attn/Unsqueeze_15" Unsqueeze (/blocks.5/self_attn/Constant_39_output_0/blocks.5/self_attn/Constant_39"Constant*G value*;B+/blocks.5/self_attn/Constant_39_attr::valueJ  %/blocks.5/self_attn/Gather_9_output_0 (/blocks.5/self_attn/Constant_39_output_0)/blocks.5/self_attn/Unsqueeze_16_output_0 /blocks.5/self_attn/Unsqueeze_16" Unsqueeze  )/blocks.5/self_attn/Unsqueeze_13_output_0 )/blocks.5/self_attn/Unsqueeze_14_output_0 (/blocks.5/self_attn/Constant_37_output_0 )/blocks.5/self_attn/Unsqueeze_15_output_0 )/blocks.5/self_attn/Unsqueeze_16_output_0%/blocks.5/self_attn/Concat_8_output_0/blocks.5/self_attn/Concat_8"Concat* axis (/blocks.5/self_attn/Constant_40_output_0/blocks.5/self_attn/Constant_40"Constant*G value*;B+/blocks.5/self_attn/Constant_40_attr::valueJ  %/blocks.5/self_attn/Concat_8_output_0 (/blocks.5/self_attn/Constant_40_output_0&/blocks.5/self_attn/Reshape_3_output_0/blocks.5/self_attn/Reshape_3"Reshape* allowzero r &/blocks.5/self_attn/Reshape_3_output_0$/blocks.5/self_attn/Shape_8_output_0/blocks.5/self_attn/Shape_8"Shape  $/blocks.5/self_attn/Shape_8_output_0,/blocks.5/self_attn/ConstantOfShape_output_0#/blocks.5/self_attn/ConstantOfShape"ConstantOfShape*K value*?B//blocks.5/self_attn/ConstantOfShape_attr::valueJ (/blocks.5/self_attn/Constant_41_output_0/blocks.5/self_attn/Constant_41"Constant*E value*9B+/blocks.5/self_attn/Constant_41_attr::valueJ  ,/blocks.5/self_attn/ConstantOfShape_output_0 (/blocks.5/self_attn/Constant_41_output_0"/blocks.5/self_attn/Mul_4_output_0/blocks.5/self_attn/Mul_4"Mul  &/blocks.5/self_attn/Reshape_3_output_0 "/blocks.5/self_attn/Mul_4_output_0"/blocks.5/self_attn/Equal_output_0/blocks.5/self_attn/Equal"Equal  "/blocks.5/self_attn/Equal_output_0 ,/blocks.5/self_attn/ConstantOfShape_output_0 &/blocks.5/self_attn/Reshape_3_output_0"/blocks.5/self_attn/Where_output_0/blocks.5/self_attn/Where"Where  )/blocks.5/self_attn/Unsqueeze_12_output_0 "/blocks.5/self_attn/Where_output_0#/blocks.5/self_attn/Expand_output_0/blocks.5/self_attn/Expand"Expand (/blocks.5/self_attn/Constant_42_output_0/blocks.5/self_attn/Constant_42"Constant*E value*9B+/blocks.5/self_attn/Constant_42_attr::valueJ  %/blocks.5/self_attn/Gather_7_output_0 (/blocks.5/self_attn/Constant_42_output_0"/blocks.5/self_attn/Mul_5_output_0/blocks.5/self_attn/Mul_5"Mul fonnx::Unsqueeze_1989 Constant_4012"Constant*5 value*)BConstant_4012_attr::valueJ  %/blocks.5/self_attn/Gather_6_output_0 onnx::Unsqueeze_1989)/blocks.5/self_attn/Unsqueeze_17_output_0 /blocks.5/self_attn/Unsqueeze_17" Unsqueeze fonnx::Unsqueeze_1991 Constant_4014"Constant*5 value*)BConstant_4014_attr::valueJ  "/blocks.5/self_attn/Mul_5_output_0 onnx::Unsqueeze_1991)/blocks.5/self_attn/Unsqueeze_18_output_0 /blocks.5/self_attn/Unsqueeze_18" Unsqueeze fonnx::Unsqueeze_1993 Constant_4016"Constant*5 value*)BConstant_4016_attr::valueJ  %/blocks.5/self_attn/Gather_8_output_0 onnx::Unsqueeze_1993)/blocks.5/self_attn/Unsqueeze_19_output_0 /blocks.5/self_attn/Unsqueeze_19" Unsqueeze fonnx::Unsqueeze_1995 Constant_4018"Constant*5 value*)BConstant_4018_attr::valueJ  %/blocks.5/self_attn/Gather_9_output_0 onnx::Unsqueeze_1995)/blocks.5/self_attn/Unsqueeze_20_output_0 /blocks.5/self_attn/Unsqueeze_20" Unsqueeze  )/blocks.5/self_attn/Unsqueeze_17_output_0 )/blocks.5/self_attn/Unsqueeze_18_output_0 )/blocks.5/self_attn/Unsqueeze_19_output_0 )/blocks.5/self_attn/Unsqueeze_20_output_0%/blocks.5/self_attn/Concat_9_output_0/blocks.5/self_attn/Concat_9"Concat* axis  #/blocks.5/self_attn/Expand_output_0 %/blocks.5/self_attn/Concat_9_output_0&/blocks.5/self_attn/Reshape_4_output_0/blocks.5/self_attn/Reshape_4"Reshape* allowzero t (/blocks.5/self_attn/Transpose_2_output_0$/blocks.5/self_attn/Shape_9_output_0/blocks.5/self_attn/Shape_9"Shape (/blocks.5/self_attn/Constant_43_output_0/blocks.5/self_attn/Constant_43"Constant*E value*9B+/blocks.5/self_attn/Constant_43_attr::valueJ  $/blocks.5/self_attn/Shape_9_output_0 (/blocks.5/self_attn/Constant_43_output_0&/blocks.5/self_attn/Gather_10_output_0/blocks.5/self_attn/Gather_10"Gather* axis v (/blocks.5/self_attn/Transpose_2_output_0%/blocks.5/self_attn/Shape_10_output_0/blocks.5/self_attn/Shape_10"Shape (/blocks.5/self_attn/Constant_44_output_0/blocks.5/self_attn/Constant_44"Constant*E value*9B+/blocks.5/self_attn/Constant_44_attr::valueJ  %/blocks.5/self_attn/Shape_10_output_0 (/blocks.5/self_attn/Constant_44_output_0&/blocks.5/self_attn/Gather_11_output_0/blocks.5/self_attn/Gather_11"Gather* axis v (/blocks.5/self_attn/Transpose_2_output_0%/blocks.5/self_attn/Shape_11_output_0/blocks.5/self_attn/Shape_11"Shape (/blocks.5/self_attn/Constant_45_output_0/blocks.5/self_attn/Constant_45"Constant*E value*9B+/blocks.5/self_attn/Constant_45_attr::valueJ  %/blocks.5/self_attn/Shape_11_output_0 (/blocks.5/self_attn/Constant_45_output_0&/blocks.5/self_attn/Gather_12_output_0/blocks.5/self_attn/Gather_12"Gather* axis v (/blocks.5/self_attn/Transpose_2_output_0%/blocks.5/self_attn/Shape_12_output_0/blocks.5/self_attn/Shape_12"Shape (/blocks.5/self_attn/Constant_46_output_0/blocks.5/self_attn/Constant_46"Constant*E value*9B+/blocks.5/self_attn/Constant_46_attr::valueJ  %/blocks.5/self_attn/Shape_12_output_0 (/blocks.5/self_attn/Constant_46_output_0&/blocks.5/self_attn/Gather_13_output_0/blocks.5/self_attn/Gather_13"Gather* axis (/blocks.5/self_attn/Constant_47_output_0/blocks.5/self_attn/Constant_47"Constant*G value*;B+/blocks.5/self_attn/Constant_47_attr::valueJ  (/blocks.5/self_attn/Transpose_2_output_0 (/blocks.5/self_attn/Constant_47_output_0)/blocks.5/self_attn/Unsqueeze_21_output_0 /blocks.5/self_attn/Unsqueeze_21" Unsqueeze (/blocks.5/self_attn/Constant_48_output_0/blocks.5/self_attn/Constant_48"Constant*G value*;B+/blocks.5/self_attn/Constant_48_attr::valueJ  &/blocks.5/self_attn/Gather_10_output_0 (/blocks.5/self_attn/Constant_48_output_0)/blocks.5/self_attn/Unsqueeze_22_output_0 /blocks.5/self_attn/Unsqueeze_22" Unsqueeze (/blocks.5/self_attn/Constant_49_output_0/blocks.5/self_attn/Constant_49"Constant*G value*;B+/blocks.5/self_attn/Constant_49_attr::valueJ  &/blocks.5/self_attn/Gather_11_output_0 (/blocks.5/self_attn/Constant_49_output_0)/blocks.5/self_attn/Unsqueeze_23_output_0 /blocks.5/self_attn/Unsqueeze_23" Unsqueeze (/blocks.5/self_attn/Constant_50_output_0/blocks.5/self_attn/Constant_50"Constant*G value*;B+/blocks.5/self_attn/Constant_50_attr::valueJ (/blocks.5/self_attn/Constant_51_output_0/blocks.5/self_attn/Constant_51"Constant*G value*;B+/blocks.5/self_attn/Constant_51_attr::valueJ  &/blocks.5/self_attn/Gather_12_output_0 (/blocks.5/self_attn/Constant_51_output_0)/blocks.5/self_attn/Unsqueeze_24_output_0 /blocks.5/self_attn/Unsqueeze_24" Unsqueeze (/blocks.5/self_attn/Constant_52_output_0/blocks.5/self_attn/Constant_52"Constant*G value*;B+/blocks.5/self_attn/Constant_52_attr::valueJ  &/blocks.5/self_attn/Gather_13_output_0 (/blocks.5/self_attn/Constant_52_output_0)/blocks.5/self_attn/Unsqueeze_25_output_0 /blocks.5/self_attn/Unsqueeze_25" Unsqueeze  )/blocks.5/self_attn/Unsqueeze_22_output_0 )/blocks.5/self_attn/Unsqueeze_23_output_0 (/blocks.5/self_attn/Constant_50_output_0 )/blocks.5/self_attn/Unsqueeze_24_output_0 )/blocks.5/self_attn/Unsqueeze_25_output_0&/blocks.5/self_attn/Concat_10_output_0/blocks.5/self_attn/Concat_10"Concat* axis (/blocks.5/self_attn/Constant_53_output_0/blocks.5/self_attn/Constant_53"Constant*G value*;B+/blocks.5/self_attn/Constant_53_attr::valueJ  &/blocks.5/self_attn/Concat_10_output_0 (/blocks.5/self_attn/Constant_53_output_0&/blocks.5/self_attn/Reshape_5_output_0/blocks.5/self_attn/Reshape_5"Reshape* allowzero t &/blocks.5/self_attn/Reshape_5_output_0%/blocks.5/self_attn/Shape_13_output_0/blocks.5/self_attn/Shape_13"Shape  %/blocks.5/self_attn/Shape_13_output_0./blocks.5/self_attn/ConstantOfShape_1_output_0%/blocks.5/self_attn/ConstantOfShape_1"ConstantOfShape*M value*AB1/blocks.5/self_attn/ConstantOfShape_1_attr::valueJ (/blocks.5/self_attn/Constant_54_output_0/blocks.5/self_attn/Constant_54"Constant*E value*9B+/blocks.5/self_attn/Constant_54_attr::valueJ  ./blocks.5/self_attn/ConstantOfShape_1_output_0 (/blocks.5/self_attn/Constant_54_output_0"/blocks.5/self_attn/Mul_6_output_0/blocks.5/self_attn/Mul_6"Mul  &/blocks.5/self_attn/Reshape_5_output_0 "/blocks.5/self_attn/Mul_6_output_0$/blocks.5/self_attn/Equal_1_output_0/blocks.5/self_attn/Equal_1"Equal  $/blocks.5/self_attn/Equal_1_output_0 ./blocks.5/self_attn/ConstantOfShape_1_output_0 &/blocks.5/self_attn/Reshape_5_output_0$/blocks.5/self_attn/Where_1_output_0/blocks.5/self_attn/Where_1"Where  )/blocks.5/self_attn/Unsqueeze_21_output_0 $/blocks.5/self_attn/Where_1_output_0%/blocks.5/self_attn/Expand_1_output_0/blocks.5/self_attn/Expand_1"Expand (/blocks.5/self_attn/Constant_55_output_0/blocks.5/self_attn/Constant_55"Constant*E value*9B+/blocks.5/self_attn/Constant_55_attr::valueJ  &/blocks.5/self_attn/Gather_11_output_0 (/blocks.5/self_attn/Constant_55_output_0"/blocks.5/self_attn/Mul_7_output_0/blocks.5/self_attn/Mul_7"Mul fonnx::Unsqueeze_2035 Constant_4057"Constant*5 value*)BConstant_4057_attr::valueJ  &/blocks.5/self_attn/Gather_10_output_0 onnx::Unsqueeze_2035)/blocks.5/self_attn/Unsqueeze_26_output_0 /blocks.5/self_attn/Unsqueeze_26" Unsqueeze fonnx::Unsqueeze_2037 Constant_4059"Constant*5 value*)BConstant_4059_attr::valueJ  "/blocks.5/self_attn/Mul_7_output_0 onnx::Unsqueeze_2037)/blocks.5/self_attn/Unsqueeze_27_output_0 /blocks.5/self_attn/Unsqueeze_27" Unsqueeze fonnx::Unsqueeze_2039 Constant_4061"Constant*5 value*)BConstant_4061_attr::valueJ  &/blocks.5/self_attn/Gather_12_output_0 onnx::Unsqueeze_2039)/blocks.5/self_attn/Unsqueeze_28_output_0 /blocks.5/self_attn/Unsqueeze_28" Unsqueeze fonnx::Unsqueeze_2041 Constant_4063"Constant*5 value*)BConstant_4063_attr::valueJ  &/blocks.5/self_attn/Gather_13_output_0 onnx::Unsqueeze_2041)/blocks.5/self_attn/Unsqueeze_29_output_0 /blocks.5/self_attn/Unsqueeze_29" Unsqueeze  )/blocks.5/self_attn/Unsqueeze_26_output_0 )/blocks.5/self_attn/Unsqueeze_27_output_0 )/blocks.5/self_attn/Unsqueeze_28_output_0 )/blocks.5/self_attn/Unsqueeze_29_output_0&/blocks.5/self_attn/Concat_11_output_0/blocks.5/self_attn/Concat_11"Concat* axis  %/blocks.5/self_attn/Expand_1_output_0 &/blocks.5/self_attn/Concat_11_output_0&/blocks.5/self_attn/Reshape_6_output_0/blocks.5/self_attn/Reshape_6"Reshape* allowzero  &/blocks.5/self_attn/Transpose_output_0 &/blocks.5/self_attn/Reshape_4_output_0#/blocks.5/self_attn/MatMul_output_0/blocks.5/self_attn/MatMul"MatMul (/blocks.5/self_attn/Constant_56_output_0/blocks.5/self_attn/Constant_56"Constant*A value*5B+/blocks.5/self_attn/Constant_56_attr::valueJ5A  #/blocks.5/self_attn/MatMul_output_0 (/blocks.5/self_attn/Constant_56_output_0"/blocks.5/self_attn/Div_2_output_0/blocks.5/self_attn/Div_2"Div x "/blocks.5/self_attn/Div_2_output_0 attention_mask"/blocks.5/self_attn/Add_2_output_0/blocks.5/self_attn/Add_2"Add  "/blocks.5/self_attn/Add_2_output_0$/blocks.5/self_attn/Softmax_output_0/blocks.5/self_attn/Softmax"Softmax* axis x $/blocks.5/self_attn/Softmax_output_0#/blocks.5/self_attn/Cast_4_output_0/blocks.5/self_attn/Cast_4"Cast* to  #/blocks.5/self_attn/Cast_4_output_0 &/blocks.5/self_attn/Reshape_6_output_0%/blocks.5/self_attn/MatMul_1_output_0/blocks.5/self_attn/MatMul_1"MatMul  %/blocks.5/self_attn/MatMul_1_output_0(/blocks.5/self_attn/Transpose_3_output_0/blocks.5/self_attn/Transpose_3" Transpose* perm@@@@ fonnx::Unsqueeze_2053 Constant_4075"Constant*5 value*)BConstant_4075_attr::valueJ  #/blocks.5/self_attn/Gather_output_0 onnx::Unsqueeze_2053)/blocks.5/self_attn/Unsqueeze_30_output_0 /blocks.5/self_attn/Unsqueeze_30" Unsqueeze fonnx::Unsqueeze_2055 Constant_4077"Constant*5 value*)BConstant_4077_attr::valueJ  %/blocks.5/self_attn/Gather_1_output_0 onnx::Unsqueeze_2055)/blocks.5/self_attn/Unsqueeze_31_output_0 /blocks.5/self_attn/Unsqueeze_31" Unsqueeze (/blocks.5/self_attn/Constant_57_output_0/blocks.5/self_attn/Constant_57"Constant*G value*;B+/blocks.5/self_attn/Constant_57_attr::valueJ  )/blocks.5/self_attn/Unsqueeze_30_output_0 )/blocks.5/self_attn/Unsqueeze_31_output_0 (/blocks.5/self_attn/Constant_57_output_0&/blocks.5/self_attn/Concat_12_output_0/blocks.5/self_attn/Concat_12"Concat* axis  (/blocks.5/self_attn/Transpose_3_output_0 &/blocks.5/self_attn/Concat_12_output_0&/blocks.5/self_attn/Reshape_7_output_0/blocks.5/self_attn/Reshape_7"Reshape* allowzero  &/blocks.5/self_attn/Reshape_7_output_0 onnx::MatMul_8729*/blocks.5/self_attn/o_proj/MatMul_output_0!/blocks.5/self_attn/o_proj/MatMul"MatMul  )/blocks.5/input_layernorm/Cast_1_output_0 */blocks.5/self_attn/o_proj/MatMul_output_0/blocks.5/Add_output_0 /blocks.5/Add"Add  /blocks.5/Add_output_00/blocks.5/post_attention_layernorm/Cast_output_0'/blocks.5/post_attention_layernorm/Cast"Cast* to 4/blocks.5/post_attention_layernorm/Constant_output_0+/blocks.5/post_attention_layernorm/Constant"Constant*M value*AB7/blocks.5/post_attention_layernorm/Constant_attr::valueJ@  0/blocks.5/post_attention_layernorm/Cast_output_0 4/blocks.5/post_attention_layernorm/Constant_output_0//blocks.5/post_attention_layernorm/Pow_output_0&/blocks.5/post_attention_layernorm/Pow"Pow  //blocks.5/post_attention_layernorm/Pow_output_06/blocks.5/post_attention_layernorm/ReduceMean_output_0-/blocks.5/post_attention_layernorm/ReduceMean" ReduceMean* axes@* keepdims 6/blocks.5/post_attention_layernorm/Constant_1_output_0-/blocks.5/post_attention_layernorm/Constant_1"Constant*O value*CB9/blocks.5/post_attention_layernorm/Constant_1_attr::valueJ75  6/blocks.5/post_attention_layernorm/ReduceMean_output_0 6/blocks.5/post_attention_layernorm/Constant_1_output_0//blocks.5/post_attention_layernorm/Add_output_0&/blocks.5/post_attention_layernorm/Add"Add  //blocks.5/post_attention_layernorm/Add_output_00/blocks.5/post_attention_layernorm/Sqrt_output_0'/blocks.5/post_attention_layernorm/Sqrt"Sqrt 6/blocks.5/post_attention_layernorm/Constant_2_output_0-/blocks.5/post_attention_layernorm/Constant_2"Constant*O value*CB9/blocks.5/post_attention_layernorm/Constant_2_attr::valueJ?  6/blocks.5/post_attention_layernorm/Constant_2_output_0 0/blocks.5/post_attention_layernorm/Sqrt_output_0//blocks.5/post_attention_layernorm/Div_output_0&/blocks.5/post_attention_layernorm/Div"Div  0/blocks.5/post_attention_layernorm/Cast_output_02/blocks.5/post_attention_layernorm/Cast_1_output_0)/blocks.5/post_attention_layernorm/Cast_1"Cast* to  2/blocks.5/post_attention_layernorm/Cast_1_output_0 //blocks.5/post_attention_layernorm/Div_output_0//blocks.5/post_attention_layernorm/Mul_output_0&/blocks.5/post_attention_layernorm/Mul"Mul  //blocks.5/post_attention_layernorm/Mul_output_0 (blocks.5.post_attention_layernorm.weight1/blocks.5/post_attention_layernorm/Mul_1_output_0(/blocks.5/post_attention_layernorm/Mul_1"Mul  1/blocks.5/post_attention_layernorm/Mul_1_output_02/blocks.5/post_attention_layernorm/Cast_2_output_0)/blocks.5/post_attention_layernorm/Cast_2"Cast* to  2/blocks.5/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_8730'/blocks.5/mlp/gate_proj/MatMul_output_0/blocks.5/mlp/gate_proj/MatMul"MatMul w '/blocks.5/mlp/gate_proj/MatMul_output_0%/blocks.5/mlp/act_fn/Sigmoid_output_0/blocks.5/mlp/act_fn/Sigmoid"Sigmoid  '/blocks.5/mlp/gate_proj/MatMul_output_0 %/blocks.5/mlp/act_fn/Sigmoid_output_0!/blocks.5/mlp/act_fn/Mul_output_0/blocks.5/mlp/act_fn/Mul"Mul  2/blocks.5/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_8731%/blocks.5/mlp/up_proj/MatMul_output_0/blocks.5/mlp/up_proj/MatMul"MatMul ~ !/blocks.5/mlp/act_fn/Mul_output_0 %/blocks.5/mlp/up_proj/MatMul_output_0/blocks.5/mlp/Mul_output_0/blocks.5/mlp/Mul"Mul  /blocks.5/mlp/Mul_output_0 onnx::MatMul_8732'/blocks.5/mlp/down_proj/MatMul_output_0/blocks.5/mlp/down_proj/MatMul"MatMul  2/blocks.5/post_attention_layernorm/Cast_1_output_0 '/blocks.5/mlp/down_proj/MatMul_output_0/blocks.5/Add_1_output_0/blocks.5/Add_1"Add ` past_key_values /rotary/Constant_output_0/Gather_6_output_0 /Gather_6"Gather* axis /blocks.6/Constant_output_0/blocks.6/Constant"Constant*J value*>B/blocks.6/Constant_attr::valueJ  /blocks.5/Add_1_output_0 /blocks.6/Constant_output_0/blocks.6/Reshape_output_0/blocks.6/Reshape"Reshape* allowzero v /blocks.6/Reshape_output_0'/blocks.6/input_layernorm/Cast_output_0/blocks.6/input_layernorm/Cast"Cast* to +/blocks.6/input_layernorm/Constant_output_0"/blocks.6/input_layernorm/Constant"Constant*D value*8B./blocks.6/input_layernorm/Constant_attr::valueJ@  '/blocks.6/input_layernorm/Cast_output_0 +/blocks.6/input_layernorm/Constant_output_0&/blocks.6/input_layernorm/Pow_output_0/blocks.6/input_layernorm/Pow"Pow  &/blocks.6/input_layernorm/Pow_output_0-/blocks.6/input_layernorm/ReduceMean_output_0$/blocks.6/input_layernorm/ReduceMean" ReduceMean* axes@* keepdims -/blocks.6/input_layernorm/Constant_1_output_0$/blocks.6/input_layernorm/Constant_1"Constant*F value*:B0/blocks.6/input_layernorm/Constant_1_attr::valueJ75  -/blocks.6/input_layernorm/ReduceMean_output_0 -/blocks.6/input_layernorm/Constant_1_output_0&/blocks.6/input_layernorm/Add_output_0/blocks.6/input_layernorm/Add"Add w &/blocks.6/input_layernorm/Add_output_0'/blocks.6/input_layernorm/Sqrt_output_0/blocks.6/input_layernorm/Sqrt"Sqrt -/blocks.6/input_layernorm/Constant_2_output_0$/blocks.6/input_layernorm/Constant_2"Constant*F value*:B0/blocks.6/input_layernorm/Constant_2_attr::valueJ?  -/blocks.6/input_layernorm/Constant_2_output_0 '/blocks.6/input_layernorm/Sqrt_output_0&/blocks.6/input_layernorm/Div_output_0/blocks.6/input_layernorm/Div"Div  '/blocks.6/input_layernorm/Cast_output_0)/blocks.6/input_layernorm/Cast_1_output_0 /blocks.6/input_layernorm/Cast_1"Cast* to  )/blocks.6/input_layernorm/Cast_1_output_0 &/blocks.6/input_layernorm/Div_output_0&/blocks.6/input_layernorm/Mul_output_0/blocks.6/input_layernorm/Mul"Mul  &/blocks.6/input_layernorm/Mul_output_0 blocks.6.input_layernorm.weight(/blocks.6/input_layernorm/Mul_1_output_0/blocks.6/input_layernorm/Mul_1"Mul  (/blocks.6/input_layernorm/Mul_1_output_0)/blocks.6/input_layernorm/Cast_2_output_0 /blocks.6/input_layernorm/Cast_2"Cast* to q )/blocks.6/input_layernorm/Cast_2_output_0"/blocks.6/self_attn/Shape_output_0/blocks.6/self_attn/Shape"Shape %/blocks.6/self_attn/Constant_output_0/blocks.6/self_attn/Constant"Constant*B value*6B(/blocks.6/self_attn/Constant_attr::valueJ  "/blocks.6/self_attn/Shape_output_0 %/blocks.6/self_attn/Constant_output_0#/blocks.6/self_attn/Gather_output_0/blocks.6/self_attn/Gather"Gather* axis u )/blocks.6/input_layernorm/Cast_2_output_0$/blocks.6/self_attn/Shape_1_output_0/blocks.6/self_attn/Shape_1"Shape '/blocks.6/self_attn/Constant_1_output_0/blocks.6/self_attn/Constant_1"Constant*D value*8B*/blocks.6/self_attn/Constant_1_attr::valueJ  $/blocks.6/self_attn/Shape_1_output_0 '/blocks.6/self_attn/Constant_1_output_0%/blocks.6/self_attn/Gather_1_output_0/blocks.6/self_attn/Gather_1"Gather* axis  )/blocks.6/input_layernorm/Cast_2_output_0 onnx::MatMul_8733*/blocks.6/self_attn/q_proj/MatMul_output_0!/blocks.6/self_attn/q_proj/MatMul"MatMul  )/blocks.6/input_layernorm/Cast_2_output_0 onnx::MatMul_8734*/blocks.6/self_attn/k_proj/MatMul_output_0!/blocks.6/self_attn/k_proj/MatMul"MatMul  )/blocks.6/input_layernorm/Cast_2_output_0 onnx::MatMul_8735*/blocks.6/self_attn/v_proj/MatMul_output_0!/blocks.6/self_attn/v_proj/MatMul"MatMul fonnx::Unsqueeze_2115 Constant_4129"Constant*5 value*)BConstant_4129_attr::valueJ  #/blocks.6/self_attn/Gather_output_0 onnx::Unsqueeze_2115&/blocks.6/self_attn/Unsqueeze_output_0/blocks.6/self_attn/Unsqueeze" Unsqueeze fonnx::Unsqueeze_2117 Constant_4131"Constant*5 value*)BConstant_4131_attr::valueJ  %/blocks.6/self_attn/Gather_1_output_0 onnx::Unsqueeze_2117(/blocks.6/self_attn/Unsqueeze_1_output_0/blocks.6/self_attn/Unsqueeze_1" Unsqueeze '/blocks.6/self_attn/Constant_2_output_0/blocks.6/self_attn/Constant_2"Constant*F value*:B*/blocks.6/self_attn/Constant_2_attr::valueJ '/blocks.6/self_attn/Constant_3_output_0/blocks.6/self_attn/Constant_3"Constant*F value*:B*/blocks.6/self_attn/Constant_3_attr::valueJ  &/blocks.6/self_attn/Unsqueeze_output_0 (/blocks.6/self_attn/Unsqueeze_1_output_0 '/blocks.6/self_attn/Constant_2_output_0 '/blocks.6/self_attn/Constant_3_output_0#/blocks.6/self_attn/Concat_output_0/blocks.6/self_attn/Concat"Concat* axis  */blocks.6/self_attn/q_proj/MatMul_output_0 #/blocks.6/self_attn/Concat_output_0$/blocks.6/self_attn/Reshape_output_0/blocks.6/self_attn/Reshape"Reshape* allowzero fonnx::Unsqueeze_2125 Constant_4137"Constant*5 value*)BConstant_4137_attr::valueJ  #/blocks.6/self_attn/Gather_output_0 onnx::Unsqueeze_2125(/blocks.6/self_attn/Unsqueeze_2_output_0/blocks.6/self_attn/Unsqueeze_2" Unsqueeze fonnx::Unsqueeze_2127 Constant_4139"Constant*5 value*)BConstant_4139_attr::valueJ  %/blocks.6/self_attn/Gather_1_output_0 onnx::Unsqueeze_2127(/blocks.6/self_attn/Unsqueeze_3_output_0/blocks.6/self_attn/Unsqueeze_3" Unsqueeze '/blocks.6/self_attn/Constant_4_output_0/blocks.6/self_attn/Constant_4"Constant*F value*:B*/blocks.6/self_attn/Constant_4_attr::valueJ '/blocks.6/self_attn/Constant_5_output_0/blocks.6/self_attn/Constant_5"Constant*F value*:B*/blocks.6/self_attn/Constant_5_attr::valueJ  (/blocks.6/self_attn/Unsqueeze_2_output_0 (/blocks.6/self_attn/Unsqueeze_3_output_0 '/blocks.6/self_attn/Constant_4_output_0 '/blocks.6/self_attn/Constant_5_output_0%/blocks.6/self_attn/Concat_1_output_0/blocks.6/self_attn/Concat_1"Concat* axis fonnx::Unsqueeze_2134 Constant_4144"Constant*5 value*)BConstant_4144_attr::valueJ  #/blocks.6/self_attn/Gather_output_0 onnx::Unsqueeze_2134(/blocks.6/self_attn/Unsqueeze_4_output_0/blocks.6/self_attn/Unsqueeze_4" Unsqueeze fonnx::Unsqueeze_2136 Constant_4146"Constant*5 value*)BConstant_4146_attr::valueJ  %/blocks.6/self_attn/Gather_1_output_0 onnx::Unsqueeze_2136(/blocks.6/self_attn/Unsqueeze_5_output_0/blocks.6/self_attn/Unsqueeze_5" Unsqueeze '/blocks.6/self_attn/Constant_6_output_0/blocks.6/self_attn/Constant_6"Constant*F value*:B*/blocks.6/self_attn/Constant_6_attr::valueJ '/blocks.6/self_attn/Constant_7_output_0/blocks.6/self_attn/Constant_7"Constant*F value*:B*/blocks.6/self_attn/Constant_7_attr::valueJ  (/blocks.6/self_attn/Unsqueeze_4_output_0 (/blocks.6/self_attn/Unsqueeze_5_output_0 '/blocks.6/self_attn/Constant_6_output_0 '/blocks.6/self_attn/Constant_7_output_0%/blocks.6/self_attn/Concat_2_output_0/blocks.6/self_attn/Concat_2"Concat* axis  */blocks.6/self_attn/k_proj/MatMul_output_0 %/blocks.6/self_attn/Concat_1_output_0&/blocks.6/self_attn/Reshape_1_output_0/blocks.6/self_attn/Reshape_1"Reshape* allowzero  */blocks.6/self_attn/v_proj/MatMul_output_0 %/blocks.6/self_attn/Concat_2_output_0&/blocks.6/self_attn/Reshape_2_output_0/blocks.6/self_attn/Reshape_2"Reshape* allowzero  $/blocks.6/self_attn/Reshape_output_0(/blocks.6/self_attn/q_norm/Cast_output_0/blocks.6/self_attn/q_norm/Cast"Cast* to ,/blocks.6/self_attn/q_norm/Constant_output_0#/blocks.6/self_attn/q_norm/Constant"Constant*E value*9B//blocks.6/self_attn/q_norm/Constant_attr::valueJ@  (/blocks.6/self_attn/q_norm/Cast_output_0 ,/blocks.6/self_attn/q_norm/Constant_output_0'/blocks.6/self_attn/q_norm/Pow_output_0/blocks.6/self_attn/q_norm/Pow"Pow  '/blocks.6/self_attn/q_norm/Pow_output_0./blocks.6/self_attn/q_norm/ReduceMean_output_0%/blocks.6/self_attn/q_norm/ReduceMean" ReduceMean* axes@* keepdims ./blocks.6/self_attn/q_norm/Constant_1_output_0%/blocks.6/self_attn/q_norm/Constant_1"Constant*G value*;B1/blocks.6/self_attn/q_norm/Constant_1_attr::valueJ75  ./blocks.6/self_attn/q_norm/ReduceMean_output_0 ./blocks.6/self_attn/q_norm/Constant_1_output_0'/blocks.6/self_attn/q_norm/Add_output_0/blocks.6/self_attn/q_norm/Add"Add z '/blocks.6/self_attn/q_norm/Add_output_0(/blocks.6/self_attn/q_norm/Sqrt_output_0/blocks.6/self_attn/q_norm/Sqrt"Sqrt ./blocks.6/self_attn/q_norm/Constant_2_output_0%/blocks.6/self_attn/q_norm/Constant_2"Constant*G value*;B1/blocks.6/self_attn/q_norm/Constant_2_attr::valueJ?  ./blocks.6/self_attn/q_norm/Constant_2_output_0 (/blocks.6/self_attn/q_norm/Sqrt_output_0'/blocks.6/self_attn/q_norm/Div_output_0/blocks.6/self_attn/q_norm/Div"Div  (/blocks.6/self_attn/q_norm/Cast_output_0*/blocks.6/self_attn/q_norm/Cast_1_output_0!/blocks.6/self_attn/q_norm/Cast_1"Cast* to  */blocks.6/self_attn/q_norm/Cast_1_output_0 '/blocks.6/self_attn/q_norm/Div_output_0'/blocks.6/self_attn/q_norm/Mul_output_0/blocks.6/self_attn/q_norm/Mul"Mul  '/blocks.6/self_attn/q_norm/Mul_output_0 blocks.6.self_attn.q_norm.weight)/blocks.6/self_attn/q_norm/Mul_1_output_0 /blocks.6/self_attn/q_norm/Mul_1"Mul  )/blocks.6/self_attn/q_norm/Mul_1_output_0*/blocks.6/self_attn/q_norm/Cast_2_output_0!/blocks.6/self_attn/q_norm/Cast_2"Cast* to  &/blocks.6/self_attn/Reshape_1_output_0(/blocks.6/self_attn/k_norm/Cast_output_0/blocks.6/self_attn/k_norm/Cast"Cast* to ,/blocks.6/self_attn/k_norm/Constant_output_0#/blocks.6/self_attn/k_norm/Constant"Constant*E value*9B//blocks.6/self_attn/k_norm/Constant_attr::valueJ@  (/blocks.6/self_attn/k_norm/Cast_output_0 ,/blocks.6/self_attn/k_norm/Constant_output_0'/blocks.6/self_attn/k_norm/Pow_output_0/blocks.6/self_attn/k_norm/Pow"Pow  '/blocks.6/self_attn/k_norm/Pow_output_0./blocks.6/self_attn/k_norm/ReduceMean_output_0%/blocks.6/self_attn/k_norm/ReduceMean" ReduceMean* axes@* keepdims ./blocks.6/self_attn/k_norm/Constant_1_output_0%/blocks.6/self_attn/k_norm/Constant_1"Constant*G value*;B1/blocks.6/self_attn/k_norm/Constant_1_attr::valueJ75  ./blocks.6/self_attn/k_norm/ReduceMean_output_0 ./blocks.6/self_attn/k_norm/Constant_1_output_0'/blocks.6/self_attn/k_norm/Add_output_0/blocks.6/self_attn/k_norm/Add"Add z '/blocks.6/self_attn/k_norm/Add_output_0(/blocks.6/self_attn/k_norm/Sqrt_output_0/blocks.6/self_attn/k_norm/Sqrt"Sqrt ./blocks.6/self_attn/k_norm/Constant_2_output_0%/blocks.6/self_attn/k_norm/Constant_2"Constant*G value*;B1/blocks.6/self_attn/k_norm/Constant_2_attr::valueJ?  ./blocks.6/self_attn/k_norm/Constant_2_output_0 (/blocks.6/self_attn/k_norm/Sqrt_output_0'/blocks.6/self_attn/k_norm/Div_output_0/blocks.6/self_attn/k_norm/Div"Div  (/blocks.6/self_attn/k_norm/Cast_output_0*/blocks.6/self_attn/k_norm/Cast_1_output_0!/blocks.6/self_attn/k_norm/Cast_1"Cast* to  */blocks.6/self_attn/k_norm/Cast_1_output_0 '/blocks.6/self_attn/k_norm/Div_output_0'/blocks.6/self_attn/k_norm/Mul_output_0/blocks.6/self_attn/k_norm/Mul"Mul  '/blocks.6/self_attn/k_norm/Mul_output_0 blocks.6.self_attn.k_norm.weight)/blocks.6/self_attn/k_norm/Mul_1_output_0 /blocks.6/self_attn/k_norm/Mul_1"Mul  )/blocks.6/self_attn/k_norm/Mul_1_output_0*/blocks.6/self_attn/k_norm/Cast_2_output_0!/blocks.6/self_attn/k_norm/Cast_2"Cast* to  */blocks.6/self_attn/q_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0 /blocks.6/self_attn/Mul_output_0/blocks.6/self_attn/Mul"Mul v */blocks.6/self_attn/q_norm/Cast_2_output_0$/blocks.6/self_attn/Shape_2_output_0/blocks.6/self_attn/Shape_2"Shape '/blocks.6/self_attn/Constant_8_output_0/blocks.6/self_attn/Constant_8"Constant*D value*8B*/blocks.6/self_attn/Constant_8_attr::valueJ  $/blocks.6/self_attn/Shape_2_output_0 '/blocks.6/self_attn/Constant_8_output_0%/blocks.6/self_attn/Gather_2_output_0/blocks.6/self_attn/Gather_2"Gather* axis '/blocks.6/self_attn/Constant_9_output_0/blocks.6/self_attn/Constant_9"Constant*D value*8B*/blocks.6/self_attn/Constant_9_attr::valueJ  %/blocks.6/self_attn/Gather_2_output_0 '/blocks.6/self_attn/Constant_9_output_0 /blocks.6/self_attn/Div_output_0/blocks.6/self_attn/Div"Div p /blocks.6/self_attn/Div_output_0!/blocks.6/self_attn/Cast_output_0/blocks.6/self_attn/Cast"Cast* to u !/blocks.6/self_attn/Cast_output_0#/blocks.6/self_attn/Cast_1_output_0/blocks.6/self_attn/Cast_1"Cast* to (/blocks.6/self_attn/Constant_10_output_0/blocks.6/self_attn/Constant_10"Constant*G value*;B+/blocks.6/self_attn/Constant_10_attr::valueJ (/blocks.6/self_attn/Constant_11_output_0/blocks.6/self_attn/Constant_11"Constant*G value*;B+/blocks.6/self_attn/Constant_11_attr::valueJ (/blocks.6/self_attn/Constant_12_output_0/blocks.6/self_attn/Constant_12"Constant*G value*;B+/blocks.6/self_attn/Constant_12_attr::valueJ  #/blocks.6/self_attn/Cast_1_output_0 (/blocks.6/self_attn/Constant_12_output_0(/blocks.6/self_attn/Unsqueeze_6_output_0/blocks.6/self_attn/Unsqueeze_6" Unsqueeze (/blocks.6/self_attn/Constant_13_output_0/blocks.6/self_attn/Constant_13"Constant*G value*;B+/blocks.6/self_attn/Constant_13_attr::valueJ  */blocks.6/self_attn/q_norm/Cast_2_output_0 (/blocks.6/self_attn/Constant_11_output_0 (/blocks.6/self_attn/Unsqueeze_6_output_0 (/blocks.6/self_attn/Constant_10_output_0 (/blocks.6/self_attn/Constant_13_output_0"/blocks.6/self_attn/Slice_output_0/blocks.6/self_attn/Slice"Slice (/blocks.6/self_attn/Constant_14_output_0/blocks.6/self_attn/Constant_14"Constant*G value*;B+/blocks.6/self_attn/Constant_14_attr::valueJ (/blocks.6/self_attn/Constant_15_output_0/blocks.6/self_attn/Constant_15"Constant*G value*;B+/blocks.6/self_attn/Constant_15_attr::valueJ  #/blocks.6/self_attn/Cast_1_output_0 (/blocks.6/self_attn/Constant_15_output_0(/blocks.6/self_attn/Unsqueeze_7_output_0/blocks.6/self_attn/Unsqueeze_7" Unsqueeze (/blocks.6/self_attn/Constant_16_output_0/blocks.6/self_attn/Constant_16"Constant*G value*;B+/blocks.6/self_attn/Constant_16_attr::valueJ (/blocks.6/self_attn/Constant_17_output_0/blocks.6/self_attn/Constant_17"Constant*G value*;B+/blocks.6/self_attn/Constant_17_attr::valueJ  */blocks.6/self_attn/q_norm/Cast_2_output_0 (/blocks.6/self_attn/Unsqueeze_7_output_0 (/blocks.6/self_attn/Constant_16_output_0 (/blocks.6/self_attn/Constant_14_output_0 (/blocks.6/self_attn/Constant_17_output_0$/blocks.6/self_attn/Slice_1_output_0/blocks.6/self_attn/Slice_1"Slice f $/blocks.6/self_attn/Slice_1_output_0 /blocks.6/self_attn/Neg_output_0/blocks.6/self_attn/Neg"Neg  /blocks.6/self_attn/Neg_output_0 "/blocks.6/self_attn/Slice_output_0%/blocks.6/self_attn/Concat_3_output_0/blocks.6/self_attn/Concat_3"Concat* axis  %/blocks.6/self_attn/Concat_3_output_0 %/blocks.0/self_attn/Gather_3_output_0"/blocks.6/self_attn/Mul_1_output_0/blocks.6/self_attn/Mul_1"Mul  /blocks.6/self_attn/Mul_output_0 "/blocks.6/self_attn/Mul_1_output_0 /blocks.6/self_attn/Add_output_0/blocks.6/self_attn/Add"Add  */blocks.6/self_attn/k_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0"/blocks.6/self_attn/Mul_2_output_0/blocks.6/self_attn/Mul_2"Mul v */blocks.6/self_attn/k_norm/Cast_2_output_0$/blocks.6/self_attn/Shape_3_output_0/blocks.6/self_attn/Shape_3"Shape (/blocks.6/self_attn/Constant_18_output_0/blocks.6/self_attn/Constant_18"Constant*E value*9B+/blocks.6/self_attn/Constant_18_attr::valueJ  $/blocks.6/self_attn/Shape_3_output_0 (/blocks.6/self_attn/Constant_18_output_0%/blocks.6/self_attn/Gather_3_output_0/blocks.6/self_attn/Gather_3"Gather* axis (/blocks.6/self_attn/Constant_19_output_0/blocks.6/self_attn/Constant_19"Constant*E value*9B+/blocks.6/self_attn/Constant_19_attr::valueJ  %/blocks.6/self_attn/Gather_3_output_0 (/blocks.6/self_attn/Constant_19_output_0"/blocks.6/self_attn/Div_1_output_0/blocks.6/self_attn/Div_1"Div v "/blocks.6/self_attn/Div_1_output_0#/blocks.6/self_attn/Cast_2_output_0/blocks.6/self_attn/Cast_2"Cast* to w #/blocks.6/self_attn/Cast_2_output_0#/blocks.6/self_attn/Cast_3_output_0/blocks.6/self_attn/Cast_3"Cast* to (/blocks.6/self_attn/Constant_20_output_0/blocks.6/self_attn/Constant_20"Constant*G value*;B+/blocks.6/self_attn/Constant_20_attr::valueJ (/blocks.6/self_attn/Constant_21_output_0/blocks.6/self_attn/Constant_21"Constant*G value*;B+/blocks.6/self_attn/Constant_21_attr::valueJ (/blocks.6/self_attn/Constant_22_output_0/blocks.6/self_attn/Constant_22"Constant*G value*;B+/blocks.6/self_attn/Constant_22_attr::valueJ  #/blocks.6/self_attn/Cast_3_output_0 (/blocks.6/self_attn/Constant_22_output_0(/blocks.6/self_attn/Unsqueeze_8_output_0/blocks.6/self_attn/Unsqueeze_8" Unsqueeze (/blocks.6/self_attn/Constant_23_output_0/blocks.6/self_attn/Constant_23"Constant*G value*;B+/blocks.6/self_attn/Constant_23_attr::valueJ  */blocks.6/self_attn/k_norm/Cast_2_output_0 (/blocks.6/self_attn/Constant_21_output_0 (/blocks.6/self_attn/Unsqueeze_8_output_0 (/blocks.6/self_attn/Constant_20_output_0 (/blocks.6/self_attn/Constant_23_output_0$/blocks.6/self_attn/Slice_2_output_0/blocks.6/self_attn/Slice_2"Slice (/blocks.6/self_attn/Constant_24_output_0/blocks.6/self_attn/Constant_24"Constant*G value*;B+/blocks.6/self_attn/Constant_24_attr::valueJ (/blocks.6/self_attn/Constant_25_output_0/blocks.6/self_attn/Constant_25"Constant*G value*;B+/blocks.6/self_attn/Constant_25_attr::valueJ  #/blocks.6/self_attn/Cast_3_output_0 (/blocks.6/self_attn/Constant_25_output_0(/blocks.6/self_attn/Unsqueeze_9_output_0/blocks.6/self_attn/Unsqueeze_9" Unsqueeze (/blocks.6/self_attn/Constant_26_output_0/blocks.6/self_attn/Constant_26"Constant*G value*;B+/blocks.6/self_attn/Constant_26_attr::valueJ (/blocks.6/self_attn/Constant_27_output_0/blocks.6/self_attn/Constant_27"Constant*G value*;B+/blocks.6/self_attn/Constant_27_attr::valueJ  */blocks.6/self_attn/k_norm/Cast_2_output_0 (/blocks.6/self_attn/Unsqueeze_9_output_0 (/blocks.6/self_attn/Constant_26_output_0 (/blocks.6/self_attn/Constant_24_output_0 (/blocks.6/self_attn/Constant_27_output_0$/blocks.6/self_attn/Slice_3_output_0/blocks.6/self_attn/Slice_3"Slice j $/blocks.6/self_attn/Slice_3_output_0"/blocks.6/self_attn/Neg_1_output_0/blocks.6/self_attn/Neg_1"Neg  "/blocks.6/self_attn/Neg_1_output_0 $/blocks.6/self_attn/Slice_2_output_0%/blocks.6/self_attn/Concat_4_output_0/blocks.6/self_attn/Concat_4"Concat* axis  %/blocks.6/self_attn/Concat_4_output_0 %/blocks.0/self_attn/Gather_3_output_0"/blocks.6/self_attn/Mul_3_output_0/blocks.6/self_attn/Mul_3"Mul  "/blocks.6/self_attn/Mul_2_output_0 "/blocks.6/self_attn/Mul_3_output_0"/blocks.6/self_attn/Add_1_output_0/blocks.6/self_attn/Add_1"Add  /Gather_6_output_0 /rotary/Constant_3_output_0%/blocks.6/self_attn/Gather_4_output_0/blocks.6/self_attn/Gather_4"Gather* axis  /Gather_6_output_0 /rotary/Constant_8_output_0%/blocks.6/self_attn/Gather_5_output_0/blocks.6/self_attn/Gather_5"Gather* axis  %/blocks.6/self_attn/Gather_4_output_0 "/blocks.6/self_attn/Add_1_output_0%/blocks.6/self_attn/Concat_5_output_0/blocks.6/self_attn/Concat_5"Concat* axis  %/blocks.6/self_attn/Gather_5_output_0 &/blocks.6/self_attn/Reshape_2_output_0%/blocks.6/self_attn/Concat_6_output_0/blocks.6/self_attn/Concat_6"Concat* axis (/blocks.6/self_attn/Constant_28_output_0/blocks.6/self_attn/Constant_28"Constant*G value*;B+/blocks.6/self_attn/Constant_28_attr::valueJ  %/blocks.6/self_attn/Concat_5_output_0 (/blocks.6/self_attn/Constant_28_output_0)/blocks.6/self_attn/Unsqueeze_10_output_0 /blocks.6/self_attn/Unsqueeze_10" Unsqueeze (/blocks.6/self_attn/Constant_29_output_0/blocks.6/self_attn/Constant_29"Constant*G value*;B+/blocks.6/self_attn/Constant_29_attr::valueJ  %/blocks.6/self_attn/Concat_6_output_0 (/blocks.6/self_attn/Constant_29_output_0)/blocks.6/self_attn/Unsqueeze_11_output_0 /blocks.6/self_attn/Unsqueeze_11" Unsqueeze  )/blocks.6/self_attn/Unsqueeze_10_output_0 )/blocks.6/self_attn/Unsqueeze_11_output_0%/blocks.6/self_attn/Concat_7_output_0/blocks.6/self_attn/Concat_7"Concat* axis  /blocks.6/self_attn/Add_output_0&/blocks.6/self_attn/Transpose_output_0/blocks.6/self_attn/Transpose" Transpose* perm@@@@  %/blocks.6/self_attn/Concat_5_output_0(/blocks.6/self_attn/Transpose_1_output_0/blocks.6/self_attn/Transpose_1" Transpose* perm@@@@  %/blocks.6/self_attn/Concat_6_output_0(/blocks.6/self_attn/Transpose_2_output_0/blocks.6/self_attn/Transpose_2" Transpose* perm@@@@ t (/blocks.6/self_attn/Transpose_1_output_0$/blocks.6/self_attn/Shape_4_output_0/blocks.6/self_attn/Shape_4"Shape (/blocks.6/self_attn/Constant_30_output_0/blocks.6/self_attn/Constant_30"Constant*E value*9B+/blocks.6/self_attn/Constant_30_attr::valueJ  $/blocks.6/self_attn/Shape_4_output_0 (/blocks.6/self_attn/Constant_30_output_0%/blocks.6/self_attn/Gather_6_output_0/blocks.6/self_attn/Gather_6"Gather* axis t (/blocks.6/self_attn/Transpose_1_output_0$/blocks.6/self_attn/Shape_5_output_0/blocks.6/self_attn/Shape_5"Shape (/blocks.6/self_attn/Constant_31_output_0/blocks.6/self_attn/Constant_31"Constant*E value*9B+/blocks.6/self_attn/Constant_31_attr::valueJ  $/blocks.6/self_attn/Shape_5_output_0 (/blocks.6/self_attn/Constant_31_output_0%/blocks.6/self_attn/Gather_7_output_0/blocks.6/self_attn/Gather_7"Gather* axis t (/blocks.6/self_attn/Transpose_1_output_0$/blocks.6/self_attn/Shape_6_output_0/blocks.6/self_attn/Shape_6"Shape (/blocks.6/self_attn/Constant_32_output_0/blocks.6/self_attn/Constant_32"Constant*E value*9B+/blocks.6/self_attn/Constant_32_attr::valueJ  $/blocks.6/self_attn/Shape_6_output_0 (/blocks.6/self_attn/Constant_32_output_0%/blocks.6/self_attn/Gather_8_output_0/blocks.6/self_attn/Gather_8"Gather* axis t (/blocks.6/self_attn/Transpose_1_output_0$/blocks.6/self_attn/Shape_7_output_0/blocks.6/self_attn/Shape_7"Shape (/blocks.6/self_attn/Constant_33_output_0/blocks.6/self_attn/Constant_33"Constant*E value*9B+/blocks.6/self_attn/Constant_33_attr::valueJ  $/blocks.6/self_attn/Shape_7_output_0 (/blocks.6/self_attn/Constant_33_output_0%/blocks.6/self_attn/Gather_9_output_0/blocks.6/self_attn/Gather_9"Gather* axis (/blocks.6/self_attn/Constant_34_output_0/blocks.6/self_attn/Constant_34"Constant*G value*;B+/blocks.6/self_attn/Constant_34_attr::valueJ  (/blocks.6/self_attn/Transpose_1_output_0 (/blocks.6/self_attn/Constant_34_output_0)/blocks.6/self_attn/Unsqueeze_12_output_0 /blocks.6/self_attn/Unsqueeze_12" Unsqueeze (/blocks.6/self_attn/Constant_35_output_0/blocks.6/self_attn/Constant_35"Constant*G value*;B+/blocks.6/self_attn/Constant_35_attr::valueJ  %/blocks.6/self_attn/Gather_6_output_0 (/blocks.6/self_attn/Constant_35_output_0)/blocks.6/self_attn/Unsqueeze_13_output_0 /blocks.6/self_attn/Unsqueeze_13" Unsqueeze (/blocks.6/self_attn/Constant_36_output_0/blocks.6/self_attn/Constant_36"Constant*G value*;B+/blocks.6/self_attn/Constant_36_attr::valueJ  %/blocks.6/self_attn/Gather_7_output_0 (/blocks.6/self_attn/Constant_36_output_0)/blocks.6/self_attn/Unsqueeze_14_output_0 /blocks.6/self_attn/Unsqueeze_14" Unsqueeze (/blocks.6/self_attn/Constant_37_output_0/blocks.6/self_attn/Constant_37"Constant*G value*;B+/blocks.6/self_attn/Constant_37_attr::valueJ (/blocks.6/self_attn/Constant_38_output_0/blocks.6/self_attn/Constant_38"Constant*G value*;B+/blocks.6/self_attn/Constant_38_attr::valueJ  %/blocks.6/self_attn/Gather_8_output_0 (/blocks.6/self_attn/Constant_38_output_0)/blocks.6/self_attn/Unsqueeze_15_output_0 /blocks.6/self_attn/Unsqueeze_15" Unsqueeze (/blocks.6/self_attn/Constant_39_output_0/blocks.6/self_attn/Constant_39"Constant*G value*;B+/blocks.6/self_attn/Constant_39_attr::valueJ  %/blocks.6/self_attn/Gather_9_output_0 (/blocks.6/self_attn/Constant_39_output_0)/blocks.6/self_attn/Unsqueeze_16_output_0 /blocks.6/self_attn/Unsqueeze_16" Unsqueeze  )/blocks.6/self_attn/Unsqueeze_13_output_0 )/blocks.6/self_attn/Unsqueeze_14_output_0 (/blocks.6/self_attn/Constant_37_output_0 )/blocks.6/self_attn/Unsqueeze_15_output_0 )/blocks.6/self_attn/Unsqueeze_16_output_0%/blocks.6/self_attn/Concat_8_output_0/blocks.6/self_attn/Concat_8"Concat* axis (/blocks.6/self_attn/Constant_40_output_0/blocks.6/self_attn/Constant_40"Constant*G value*;B+/blocks.6/self_attn/Constant_40_attr::valueJ  %/blocks.6/self_attn/Concat_8_output_0 (/blocks.6/self_attn/Constant_40_output_0&/blocks.6/self_attn/Reshape_3_output_0/blocks.6/self_attn/Reshape_3"Reshape* allowzero r &/blocks.6/self_attn/Reshape_3_output_0$/blocks.6/self_attn/Shape_8_output_0/blocks.6/self_attn/Shape_8"Shape  $/blocks.6/self_attn/Shape_8_output_0,/blocks.6/self_attn/ConstantOfShape_output_0#/blocks.6/self_attn/ConstantOfShape"ConstantOfShape*K value*?B//blocks.6/self_attn/ConstantOfShape_attr::valueJ (/blocks.6/self_attn/Constant_41_output_0/blocks.6/self_attn/Constant_41"Constant*E value*9B+/blocks.6/self_attn/Constant_41_attr::valueJ  ,/blocks.6/self_attn/ConstantOfShape_output_0 (/blocks.6/self_attn/Constant_41_output_0"/blocks.6/self_attn/Mul_4_output_0/blocks.6/self_attn/Mul_4"Mul  &/blocks.6/self_attn/Reshape_3_output_0 "/blocks.6/self_attn/Mul_4_output_0"/blocks.6/self_attn/Equal_output_0/blocks.6/self_attn/Equal"Equal  "/blocks.6/self_attn/Equal_output_0 ,/blocks.6/self_attn/ConstantOfShape_output_0 &/blocks.6/self_attn/Reshape_3_output_0"/blocks.6/self_attn/Where_output_0/blocks.6/self_attn/Where"Where  )/blocks.6/self_attn/Unsqueeze_12_output_0 "/blocks.6/self_attn/Where_output_0#/blocks.6/self_attn/Expand_output_0/blocks.6/self_attn/Expand"Expand (/blocks.6/self_attn/Constant_42_output_0/blocks.6/self_attn/Constant_42"Constant*E value*9B+/blocks.6/self_attn/Constant_42_attr::valueJ  %/blocks.6/self_attn/Gather_7_output_0 (/blocks.6/self_attn/Constant_42_output_0"/blocks.6/self_attn/Mul_5_output_0/blocks.6/self_attn/Mul_5"Mul fonnx::Unsqueeze_2279 Constant_4274"Constant*5 value*)BConstant_4274_attr::valueJ  %/blocks.6/self_attn/Gather_6_output_0 onnx::Unsqueeze_2279)/blocks.6/self_attn/Unsqueeze_17_output_0 /blocks.6/self_attn/Unsqueeze_17" Unsqueeze fonnx::Unsqueeze_2281 Constant_4276"Constant*5 value*)BConstant_4276_attr::valueJ  "/blocks.6/self_attn/Mul_5_output_0 onnx::Unsqueeze_2281)/blocks.6/self_attn/Unsqueeze_18_output_0 /blocks.6/self_attn/Unsqueeze_18" Unsqueeze fonnx::Unsqueeze_2283 Constant_4278"Constant*5 value*)BConstant_4278_attr::valueJ  %/blocks.6/self_attn/Gather_8_output_0 onnx::Unsqueeze_2283)/blocks.6/self_attn/Unsqueeze_19_output_0 /blocks.6/self_attn/Unsqueeze_19" Unsqueeze fonnx::Unsqueeze_2285 Constant_4280"Constant*5 value*)BConstant_4280_attr::valueJ  %/blocks.6/self_attn/Gather_9_output_0 onnx::Unsqueeze_2285)/blocks.6/self_attn/Unsqueeze_20_output_0 /blocks.6/self_attn/Unsqueeze_20" Unsqueeze  )/blocks.6/self_attn/Unsqueeze_17_output_0 )/blocks.6/self_attn/Unsqueeze_18_output_0 )/blocks.6/self_attn/Unsqueeze_19_output_0 )/blocks.6/self_attn/Unsqueeze_20_output_0%/blocks.6/self_attn/Concat_9_output_0/blocks.6/self_attn/Concat_9"Concat* axis  #/blocks.6/self_attn/Expand_output_0 %/blocks.6/self_attn/Concat_9_output_0&/blocks.6/self_attn/Reshape_4_output_0/blocks.6/self_attn/Reshape_4"Reshape* allowzero t (/blocks.6/self_attn/Transpose_2_output_0$/blocks.6/self_attn/Shape_9_output_0/blocks.6/self_attn/Shape_9"Shape (/blocks.6/self_attn/Constant_43_output_0/blocks.6/self_attn/Constant_43"Constant*E value*9B+/blocks.6/self_attn/Constant_43_attr::valueJ  $/blocks.6/self_attn/Shape_9_output_0 (/blocks.6/self_attn/Constant_43_output_0&/blocks.6/self_attn/Gather_10_output_0/blocks.6/self_attn/Gather_10"Gather* axis v (/blocks.6/self_attn/Transpose_2_output_0%/blocks.6/self_attn/Shape_10_output_0/blocks.6/self_attn/Shape_10"Shape (/blocks.6/self_attn/Constant_44_output_0/blocks.6/self_attn/Constant_44"Constant*E value*9B+/blocks.6/self_attn/Constant_44_attr::valueJ  %/blocks.6/self_attn/Shape_10_output_0 (/blocks.6/self_attn/Constant_44_output_0&/blocks.6/self_attn/Gather_11_output_0/blocks.6/self_attn/Gather_11"Gather* axis v (/blocks.6/self_attn/Transpose_2_output_0%/blocks.6/self_attn/Shape_11_output_0/blocks.6/self_attn/Shape_11"Shape (/blocks.6/self_attn/Constant_45_output_0/blocks.6/self_attn/Constant_45"Constant*E value*9B+/blocks.6/self_attn/Constant_45_attr::valueJ  %/blocks.6/self_attn/Shape_11_output_0 (/blocks.6/self_attn/Constant_45_output_0&/blocks.6/self_attn/Gather_12_output_0/blocks.6/self_attn/Gather_12"Gather* axis v (/blocks.6/self_attn/Transpose_2_output_0%/blocks.6/self_attn/Shape_12_output_0/blocks.6/self_attn/Shape_12"Shape (/blocks.6/self_attn/Constant_46_output_0/blocks.6/self_attn/Constant_46"Constant*E value*9B+/blocks.6/self_attn/Constant_46_attr::valueJ  %/blocks.6/self_attn/Shape_12_output_0 (/blocks.6/self_attn/Constant_46_output_0&/blocks.6/self_attn/Gather_13_output_0/blocks.6/self_attn/Gather_13"Gather* axis (/blocks.6/self_attn/Constant_47_output_0/blocks.6/self_attn/Constant_47"Constant*G value*;B+/blocks.6/self_attn/Constant_47_attr::valueJ  (/blocks.6/self_attn/Transpose_2_output_0 (/blocks.6/self_attn/Constant_47_output_0)/blocks.6/self_attn/Unsqueeze_21_output_0 /blocks.6/self_attn/Unsqueeze_21" Unsqueeze (/blocks.6/self_attn/Constant_48_output_0/blocks.6/self_attn/Constant_48"Constant*G value*;B+/blocks.6/self_attn/Constant_48_attr::valueJ  &/blocks.6/self_attn/Gather_10_output_0 (/blocks.6/self_attn/Constant_48_output_0)/blocks.6/self_attn/Unsqueeze_22_output_0 /blocks.6/self_attn/Unsqueeze_22" Unsqueeze (/blocks.6/self_attn/Constant_49_output_0/blocks.6/self_attn/Constant_49"Constant*G value*;B+/blocks.6/self_attn/Constant_49_attr::valueJ  &/blocks.6/self_attn/Gather_11_output_0 (/blocks.6/self_attn/Constant_49_output_0)/blocks.6/self_attn/Unsqueeze_23_output_0 /blocks.6/self_attn/Unsqueeze_23" Unsqueeze (/blocks.6/self_attn/Constant_50_output_0/blocks.6/self_attn/Constant_50"Constant*G value*;B+/blocks.6/self_attn/Constant_50_attr::valueJ (/blocks.6/self_attn/Constant_51_output_0/blocks.6/self_attn/Constant_51"Constant*G value*;B+/blocks.6/self_attn/Constant_51_attr::valueJ  &/blocks.6/self_attn/Gather_12_output_0 (/blocks.6/self_attn/Constant_51_output_0)/blocks.6/self_attn/Unsqueeze_24_output_0 /blocks.6/self_attn/Unsqueeze_24" Unsqueeze (/blocks.6/self_attn/Constant_52_output_0/blocks.6/self_attn/Constant_52"Constant*G value*;B+/blocks.6/self_attn/Constant_52_attr::valueJ  &/blocks.6/self_attn/Gather_13_output_0 (/blocks.6/self_attn/Constant_52_output_0)/blocks.6/self_attn/Unsqueeze_25_output_0 /blocks.6/self_attn/Unsqueeze_25" Unsqueeze  )/blocks.6/self_attn/Unsqueeze_22_output_0 )/blocks.6/self_attn/Unsqueeze_23_output_0 (/blocks.6/self_attn/Constant_50_output_0 )/blocks.6/self_attn/Unsqueeze_24_output_0 )/blocks.6/self_attn/Unsqueeze_25_output_0&/blocks.6/self_attn/Concat_10_output_0/blocks.6/self_attn/Concat_10"Concat* axis (/blocks.6/self_attn/Constant_53_output_0/blocks.6/self_attn/Constant_53"Constant*G value*;B+/blocks.6/self_attn/Constant_53_attr::valueJ  &/blocks.6/self_attn/Concat_10_output_0 (/blocks.6/self_attn/Constant_53_output_0&/blocks.6/self_attn/Reshape_5_output_0/blocks.6/self_attn/Reshape_5"Reshape* allowzero t &/blocks.6/self_attn/Reshape_5_output_0%/blocks.6/self_attn/Shape_13_output_0/blocks.6/self_attn/Shape_13"Shape  %/blocks.6/self_attn/Shape_13_output_0./blocks.6/self_attn/ConstantOfShape_1_output_0%/blocks.6/self_attn/ConstantOfShape_1"ConstantOfShape*M value*AB1/blocks.6/self_attn/ConstantOfShape_1_attr::valueJ (/blocks.6/self_attn/Constant_54_output_0/blocks.6/self_attn/Constant_54"Constant*E value*9B+/blocks.6/self_attn/Constant_54_attr::valueJ  ./blocks.6/self_attn/ConstantOfShape_1_output_0 (/blocks.6/self_attn/Constant_54_output_0"/blocks.6/self_attn/Mul_6_output_0/blocks.6/self_attn/Mul_6"Mul  &/blocks.6/self_attn/Reshape_5_output_0 "/blocks.6/self_attn/Mul_6_output_0$/blocks.6/self_attn/Equal_1_output_0/blocks.6/self_attn/Equal_1"Equal  $/blocks.6/self_attn/Equal_1_output_0 ./blocks.6/self_attn/ConstantOfShape_1_output_0 &/blocks.6/self_attn/Reshape_5_output_0$/blocks.6/self_attn/Where_1_output_0/blocks.6/self_attn/Where_1"Where  )/blocks.6/self_attn/Unsqueeze_21_output_0 $/blocks.6/self_attn/Where_1_output_0%/blocks.6/self_attn/Expand_1_output_0/blocks.6/self_attn/Expand_1"Expand (/blocks.6/self_attn/Constant_55_output_0/blocks.6/self_attn/Constant_55"Constant*E value*9B+/blocks.6/self_attn/Constant_55_attr::valueJ  &/blocks.6/self_attn/Gather_11_output_0 (/blocks.6/self_attn/Constant_55_output_0"/blocks.6/self_attn/Mul_7_output_0/blocks.6/self_attn/Mul_7"Mul fonnx::Unsqueeze_2325 Constant_4319"Constant*5 value*)BConstant_4319_attr::valueJ  &/blocks.6/self_attn/Gather_10_output_0 onnx::Unsqueeze_2325)/blocks.6/self_attn/Unsqueeze_26_output_0 /blocks.6/self_attn/Unsqueeze_26" Unsqueeze fonnx::Unsqueeze_2327 Constant_4321"Constant*5 value*)BConstant_4321_attr::valueJ  "/blocks.6/self_attn/Mul_7_output_0 onnx::Unsqueeze_2327)/blocks.6/self_attn/Unsqueeze_27_output_0 /blocks.6/self_attn/Unsqueeze_27" Unsqueeze fonnx::Unsqueeze_2329 Constant_4323"Constant*5 value*)BConstant_4323_attr::valueJ  &/blocks.6/self_attn/Gather_12_output_0 onnx::Unsqueeze_2329)/blocks.6/self_attn/Unsqueeze_28_output_0 /blocks.6/self_attn/Unsqueeze_28" Unsqueeze fonnx::Unsqueeze_2331 Constant_4325"Constant*5 value*)BConstant_4325_attr::valueJ  &/blocks.6/self_attn/Gather_13_output_0 onnx::Unsqueeze_2331)/blocks.6/self_attn/Unsqueeze_29_output_0 /blocks.6/self_attn/Unsqueeze_29" Unsqueeze  )/blocks.6/self_attn/Unsqueeze_26_output_0 )/blocks.6/self_attn/Unsqueeze_27_output_0 )/blocks.6/self_attn/Unsqueeze_28_output_0 )/blocks.6/self_attn/Unsqueeze_29_output_0&/blocks.6/self_attn/Concat_11_output_0/blocks.6/self_attn/Concat_11"Concat* axis  %/blocks.6/self_attn/Expand_1_output_0 &/blocks.6/self_attn/Concat_11_output_0&/blocks.6/self_attn/Reshape_6_output_0/blocks.6/self_attn/Reshape_6"Reshape* allowzero  &/blocks.6/self_attn/Transpose_output_0 &/blocks.6/self_attn/Reshape_4_output_0#/blocks.6/self_attn/MatMul_output_0/blocks.6/self_attn/MatMul"MatMul (/blocks.6/self_attn/Constant_56_output_0/blocks.6/self_attn/Constant_56"Constant*A value*5B+/blocks.6/self_attn/Constant_56_attr::valueJ5A  #/blocks.6/self_attn/MatMul_output_0 (/blocks.6/self_attn/Constant_56_output_0"/blocks.6/self_attn/Div_2_output_0/blocks.6/self_attn/Div_2"Div x "/blocks.6/self_attn/Div_2_output_0 attention_mask"/blocks.6/self_attn/Add_2_output_0/blocks.6/self_attn/Add_2"Add  "/blocks.6/self_attn/Add_2_output_0$/blocks.6/self_attn/Softmax_output_0/blocks.6/self_attn/Softmax"Softmax* axis x $/blocks.6/self_attn/Softmax_output_0#/blocks.6/self_attn/Cast_4_output_0/blocks.6/self_attn/Cast_4"Cast* to  #/blocks.6/self_attn/Cast_4_output_0 &/blocks.6/self_attn/Reshape_6_output_0%/blocks.6/self_attn/MatMul_1_output_0/blocks.6/self_attn/MatMul_1"MatMul  %/blocks.6/self_attn/MatMul_1_output_0(/blocks.6/self_attn/Transpose_3_output_0/blocks.6/self_attn/Transpose_3" Transpose* perm@@@@ fonnx::Unsqueeze_2343 Constant_4337"Constant*5 value*)BConstant_4337_attr::valueJ  #/blocks.6/self_attn/Gather_output_0 onnx::Unsqueeze_2343)/blocks.6/self_attn/Unsqueeze_30_output_0 /blocks.6/self_attn/Unsqueeze_30" Unsqueeze fonnx::Unsqueeze_2345 Constant_4339"Constant*5 value*)BConstant_4339_attr::valueJ  %/blocks.6/self_attn/Gather_1_output_0 onnx::Unsqueeze_2345)/blocks.6/self_attn/Unsqueeze_31_output_0 /blocks.6/self_attn/Unsqueeze_31" Unsqueeze (/blocks.6/self_attn/Constant_57_output_0/blocks.6/self_attn/Constant_57"Constant*G value*;B+/blocks.6/self_attn/Constant_57_attr::valueJ  )/blocks.6/self_attn/Unsqueeze_30_output_0 )/blocks.6/self_attn/Unsqueeze_31_output_0 (/blocks.6/self_attn/Constant_57_output_0&/blocks.6/self_attn/Concat_12_output_0/blocks.6/self_attn/Concat_12"Concat* axis  (/blocks.6/self_attn/Transpose_3_output_0 &/blocks.6/self_attn/Concat_12_output_0&/blocks.6/self_attn/Reshape_7_output_0/blocks.6/self_attn/Reshape_7"Reshape* allowzero  &/blocks.6/self_attn/Reshape_7_output_0 onnx::MatMul_8757*/blocks.6/self_attn/o_proj/MatMul_output_0!/blocks.6/self_attn/o_proj/MatMul"MatMul  )/blocks.6/input_layernorm/Cast_1_output_0 */blocks.6/self_attn/o_proj/MatMul_output_0/blocks.6/Add_output_0 /blocks.6/Add"Add  /blocks.6/Add_output_00/blocks.6/post_attention_layernorm/Cast_output_0'/blocks.6/post_attention_layernorm/Cast"Cast* to 4/blocks.6/post_attention_layernorm/Constant_output_0+/blocks.6/post_attention_layernorm/Constant"Constant*M value*AB7/blocks.6/post_attention_layernorm/Constant_attr::valueJ@  0/blocks.6/post_attention_layernorm/Cast_output_0 4/blocks.6/post_attention_layernorm/Constant_output_0//blocks.6/post_attention_layernorm/Pow_output_0&/blocks.6/post_attention_layernorm/Pow"Pow  //blocks.6/post_attention_layernorm/Pow_output_06/blocks.6/post_attention_layernorm/ReduceMean_output_0-/blocks.6/post_attention_layernorm/ReduceMean" ReduceMean* axes@* keepdims 6/blocks.6/post_attention_layernorm/Constant_1_output_0-/blocks.6/post_attention_layernorm/Constant_1"Constant*O value*CB9/blocks.6/post_attention_layernorm/Constant_1_attr::valueJ75  6/blocks.6/post_attention_layernorm/ReduceMean_output_0 6/blocks.6/post_attention_layernorm/Constant_1_output_0//blocks.6/post_attention_layernorm/Add_output_0&/blocks.6/post_attention_layernorm/Add"Add  //blocks.6/post_attention_layernorm/Add_output_00/blocks.6/post_attention_layernorm/Sqrt_output_0'/blocks.6/post_attention_layernorm/Sqrt"Sqrt 6/blocks.6/post_attention_layernorm/Constant_2_output_0-/blocks.6/post_attention_layernorm/Constant_2"Constant*O value*CB9/blocks.6/post_attention_layernorm/Constant_2_attr::valueJ?  6/blocks.6/post_attention_layernorm/Constant_2_output_0 0/blocks.6/post_attention_layernorm/Sqrt_output_0//blocks.6/post_attention_layernorm/Div_output_0&/blocks.6/post_attention_layernorm/Div"Div  0/blocks.6/post_attention_layernorm/Cast_output_02/blocks.6/post_attention_layernorm/Cast_1_output_0)/blocks.6/post_attention_layernorm/Cast_1"Cast* to  2/blocks.6/post_attention_layernorm/Cast_1_output_0 //blocks.6/post_attention_layernorm/Div_output_0//blocks.6/post_attention_layernorm/Mul_output_0&/blocks.6/post_attention_layernorm/Mul"Mul  //blocks.6/post_attention_layernorm/Mul_output_0 (blocks.6.post_attention_layernorm.weight1/blocks.6/post_attention_layernorm/Mul_1_output_0(/blocks.6/post_attention_layernorm/Mul_1"Mul  1/blocks.6/post_attention_layernorm/Mul_1_output_02/blocks.6/post_attention_layernorm/Cast_2_output_0)/blocks.6/post_attention_layernorm/Cast_2"Cast* to  2/blocks.6/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_8758'/blocks.6/mlp/gate_proj/MatMul_output_0/blocks.6/mlp/gate_proj/MatMul"MatMul w '/blocks.6/mlp/gate_proj/MatMul_output_0%/blocks.6/mlp/act_fn/Sigmoid_output_0/blocks.6/mlp/act_fn/Sigmoid"Sigmoid  '/blocks.6/mlp/gate_proj/MatMul_output_0 %/blocks.6/mlp/act_fn/Sigmoid_output_0!/blocks.6/mlp/act_fn/Mul_output_0/blocks.6/mlp/act_fn/Mul"Mul  2/blocks.6/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_8759%/blocks.6/mlp/up_proj/MatMul_output_0/blocks.6/mlp/up_proj/MatMul"MatMul ~ !/blocks.6/mlp/act_fn/Mul_output_0 %/blocks.6/mlp/up_proj/MatMul_output_0/blocks.6/mlp/Mul_output_0/blocks.6/mlp/Mul"Mul  /blocks.6/mlp/Mul_output_0 onnx::MatMul_8760'/blocks.6/mlp/down_proj/MatMul_output_0/blocks.6/mlp/down_proj/MatMul"MatMul  2/blocks.6/post_attention_layernorm/Cast_1_output_0 '/blocks.6/mlp/down_proj/MatMul_output_0/blocks.6/Add_1_output_0/blocks.6/Add_1"Add `/Constant_1_output_0 /Constant_1"Constant*1 value*%B/Constant_1_attr::valueJ [ past_key_values /Constant_1_output_0/Gather_7_output_0 /Gather_7"Gather* axis /blocks.7/Constant_output_0/blocks.7/Constant"Constant*J value*>B/blocks.7/Constant_attr::valueJ  /blocks.6/Add_1_output_0 /blocks.7/Constant_output_0/blocks.7/Reshape_output_0/blocks.7/Reshape"Reshape* allowzero v /blocks.7/Reshape_output_0'/blocks.7/input_layernorm/Cast_output_0/blocks.7/input_layernorm/Cast"Cast* to +/blocks.7/input_layernorm/Constant_output_0"/blocks.7/input_layernorm/Constant"Constant*D value*8B./blocks.7/input_layernorm/Constant_attr::valueJ@  '/blocks.7/input_layernorm/Cast_output_0 +/blocks.7/input_layernorm/Constant_output_0&/blocks.7/input_layernorm/Pow_output_0/blocks.7/input_layernorm/Pow"Pow  &/blocks.7/input_layernorm/Pow_output_0-/blocks.7/input_layernorm/ReduceMean_output_0$/blocks.7/input_layernorm/ReduceMean" ReduceMean* axes@* keepdims -/blocks.7/input_layernorm/Constant_1_output_0$/blocks.7/input_layernorm/Constant_1"Constant*F value*:B0/blocks.7/input_layernorm/Constant_1_attr::valueJ75  -/blocks.7/input_layernorm/ReduceMean_output_0 -/blocks.7/input_layernorm/Constant_1_output_0&/blocks.7/input_layernorm/Add_output_0/blocks.7/input_layernorm/Add"Add w &/blocks.7/input_layernorm/Add_output_0'/blocks.7/input_layernorm/Sqrt_output_0/blocks.7/input_layernorm/Sqrt"Sqrt -/blocks.7/input_layernorm/Constant_2_output_0$/blocks.7/input_layernorm/Constant_2"Constant*F value*:B0/blocks.7/input_layernorm/Constant_2_attr::valueJ?  -/blocks.7/input_layernorm/Constant_2_output_0 '/blocks.7/input_layernorm/Sqrt_output_0&/blocks.7/input_layernorm/Div_output_0/blocks.7/input_layernorm/Div"Div  '/blocks.7/input_layernorm/Cast_output_0)/blocks.7/input_layernorm/Cast_1_output_0 /blocks.7/input_layernorm/Cast_1"Cast* to  )/blocks.7/input_layernorm/Cast_1_output_0 &/blocks.7/input_layernorm/Div_output_0&/blocks.7/input_layernorm/Mul_output_0/blocks.7/input_layernorm/Mul"Mul  &/blocks.7/input_layernorm/Mul_output_0 blocks.7.input_layernorm.weight(/blocks.7/input_layernorm/Mul_1_output_0/blocks.7/input_layernorm/Mul_1"Mul  (/blocks.7/input_layernorm/Mul_1_output_0)/blocks.7/input_layernorm/Cast_2_output_0 /blocks.7/input_layernorm/Cast_2"Cast* to q )/blocks.7/input_layernorm/Cast_2_output_0"/blocks.7/self_attn/Shape_output_0/blocks.7/self_attn/Shape"Shape %/blocks.7/self_attn/Constant_output_0/blocks.7/self_attn/Constant"Constant*B value*6B(/blocks.7/self_attn/Constant_attr::valueJ  "/blocks.7/self_attn/Shape_output_0 %/blocks.7/self_attn/Constant_output_0#/blocks.7/self_attn/Gather_output_0/blocks.7/self_attn/Gather"Gather* axis u )/blocks.7/input_layernorm/Cast_2_output_0$/blocks.7/self_attn/Shape_1_output_0/blocks.7/self_attn/Shape_1"Shape '/blocks.7/self_attn/Constant_1_output_0/blocks.7/self_attn/Constant_1"Constant*D value*8B*/blocks.7/self_attn/Constant_1_attr::valueJ  $/blocks.7/self_attn/Shape_1_output_0 '/blocks.7/self_attn/Constant_1_output_0%/blocks.7/self_attn/Gather_1_output_0/blocks.7/self_attn/Gather_1"Gather* axis  )/blocks.7/input_layernorm/Cast_2_output_0 onnx::MatMul_8761*/blocks.7/self_attn/q_proj/MatMul_output_0!/blocks.7/self_attn/q_proj/MatMul"MatMul  )/blocks.7/input_layernorm/Cast_2_output_0 onnx::MatMul_8762*/blocks.7/self_attn/k_proj/MatMul_output_0!/blocks.7/self_attn/k_proj/MatMul"MatMul  )/blocks.7/input_layernorm/Cast_2_output_0 onnx::MatMul_8763*/blocks.7/self_attn/v_proj/MatMul_output_0!/blocks.7/self_attn/v_proj/MatMul"MatMul fonnx::Unsqueeze_2406 Constant_4392"Constant*5 value*)BConstant_4392_attr::valueJ  #/blocks.7/self_attn/Gather_output_0 onnx::Unsqueeze_2406&/blocks.7/self_attn/Unsqueeze_output_0/blocks.7/self_attn/Unsqueeze" Unsqueeze fonnx::Unsqueeze_2408 Constant_4394"Constant*5 value*)BConstant_4394_attr::valueJ  %/blocks.7/self_attn/Gather_1_output_0 onnx::Unsqueeze_2408(/blocks.7/self_attn/Unsqueeze_1_output_0/blocks.7/self_attn/Unsqueeze_1" Unsqueeze '/blocks.7/self_attn/Constant_2_output_0/blocks.7/self_attn/Constant_2"Constant*F value*:B*/blocks.7/self_attn/Constant_2_attr::valueJ '/blocks.7/self_attn/Constant_3_output_0/blocks.7/self_attn/Constant_3"Constant*F value*:B*/blocks.7/self_attn/Constant_3_attr::valueJ  &/blocks.7/self_attn/Unsqueeze_output_0 (/blocks.7/self_attn/Unsqueeze_1_output_0 '/blocks.7/self_attn/Constant_2_output_0 '/blocks.7/self_attn/Constant_3_output_0#/blocks.7/self_attn/Concat_output_0/blocks.7/self_attn/Concat"Concat* axis  */blocks.7/self_attn/q_proj/MatMul_output_0 #/blocks.7/self_attn/Concat_output_0$/blocks.7/self_attn/Reshape_output_0/blocks.7/self_attn/Reshape"Reshape* allowzero fonnx::Unsqueeze_2416 Constant_4400"Constant*5 value*)BConstant_4400_attr::valueJ  #/blocks.7/self_attn/Gather_output_0 onnx::Unsqueeze_2416(/blocks.7/self_attn/Unsqueeze_2_output_0/blocks.7/self_attn/Unsqueeze_2" Unsqueeze fonnx::Unsqueeze_2418 Constant_4402"Constant*5 value*)BConstant_4402_attr::valueJ  %/blocks.7/self_attn/Gather_1_output_0 onnx::Unsqueeze_2418(/blocks.7/self_attn/Unsqueeze_3_output_0/blocks.7/self_attn/Unsqueeze_3" Unsqueeze '/blocks.7/self_attn/Constant_4_output_0/blocks.7/self_attn/Constant_4"Constant*F value*:B*/blocks.7/self_attn/Constant_4_attr::valueJ '/blocks.7/self_attn/Constant_5_output_0/blocks.7/self_attn/Constant_5"Constant*F value*:B*/blocks.7/self_attn/Constant_5_attr::valueJ  (/blocks.7/self_attn/Unsqueeze_2_output_0 (/blocks.7/self_attn/Unsqueeze_3_output_0 '/blocks.7/self_attn/Constant_4_output_0 '/blocks.7/self_attn/Constant_5_output_0%/blocks.7/self_attn/Concat_1_output_0/blocks.7/self_attn/Concat_1"Concat* axis fonnx::Unsqueeze_2425 Constant_4407"Constant*5 value*)BConstant_4407_attr::valueJ  #/blocks.7/self_attn/Gather_output_0 onnx::Unsqueeze_2425(/blocks.7/self_attn/Unsqueeze_4_output_0/blocks.7/self_attn/Unsqueeze_4" Unsqueeze fonnx::Unsqueeze_2427 Constant_4409"Constant*5 value*)BConstant_4409_attr::valueJ  %/blocks.7/self_attn/Gather_1_output_0 onnx::Unsqueeze_2427(/blocks.7/self_attn/Unsqueeze_5_output_0/blocks.7/self_attn/Unsqueeze_5" Unsqueeze '/blocks.7/self_attn/Constant_6_output_0/blocks.7/self_attn/Constant_6"Constant*F value*:B*/blocks.7/self_attn/Constant_6_attr::valueJ '/blocks.7/self_attn/Constant_7_output_0/blocks.7/self_attn/Constant_7"Constant*F value*:B*/blocks.7/self_attn/Constant_7_attr::valueJ  (/blocks.7/self_attn/Unsqueeze_4_output_0 (/blocks.7/self_attn/Unsqueeze_5_output_0 '/blocks.7/self_attn/Constant_6_output_0 '/blocks.7/self_attn/Constant_7_output_0%/blocks.7/self_attn/Concat_2_output_0/blocks.7/self_attn/Concat_2"Concat* axis  */blocks.7/self_attn/k_proj/MatMul_output_0 %/blocks.7/self_attn/Concat_1_output_0&/blocks.7/self_attn/Reshape_1_output_0/blocks.7/self_attn/Reshape_1"Reshape* allowzero  */blocks.7/self_attn/v_proj/MatMul_output_0 %/blocks.7/self_attn/Concat_2_output_0&/blocks.7/self_attn/Reshape_2_output_0/blocks.7/self_attn/Reshape_2"Reshape* allowzero  $/blocks.7/self_attn/Reshape_output_0(/blocks.7/self_attn/q_norm/Cast_output_0/blocks.7/self_attn/q_norm/Cast"Cast* to ,/blocks.7/self_attn/q_norm/Constant_output_0#/blocks.7/self_attn/q_norm/Constant"Constant*E value*9B//blocks.7/self_attn/q_norm/Constant_attr::valueJ@  (/blocks.7/self_attn/q_norm/Cast_output_0 ,/blocks.7/self_attn/q_norm/Constant_output_0'/blocks.7/self_attn/q_norm/Pow_output_0/blocks.7/self_attn/q_norm/Pow"Pow  '/blocks.7/self_attn/q_norm/Pow_output_0./blocks.7/self_attn/q_norm/ReduceMean_output_0%/blocks.7/self_attn/q_norm/ReduceMean" ReduceMean* axes@* keepdims ./blocks.7/self_attn/q_norm/Constant_1_output_0%/blocks.7/self_attn/q_norm/Constant_1"Constant*G value*;B1/blocks.7/self_attn/q_norm/Constant_1_attr::valueJ75  ./blocks.7/self_attn/q_norm/ReduceMean_output_0 ./blocks.7/self_attn/q_norm/Constant_1_output_0'/blocks.7/self_attn/q_norm/Add_output_0/blocks.7/self_attn/q_norm/Add"Add z '/blocks.7/self_attn/q_norm/Add_output_0(/blocks.7/self_attn/q_norm/Sqrt_output_0/blocks.7/self_attn/q_norm/Sqrt"Sqrt ./blocks.7/self_attn/q_norm/Constant_2_output_0%/blocks.7/self_attn/q_norm/Constant_2"Constant*G value*;B1/blocks.7/self_attn/q_norm/Constant_2_attr::valueJ?  ./blocks.7/self_attn/q_norm/Constant_2_output_0 (/blocks.7/self_attn/q_norm/Sqrt_output_0'/blocks.7/self_attn/q_norm/Div_output_0/blocks.7/self_attn/q_norm/Div"Div  (/blocks.7/self_attn/q_norm/Cast_output_0*/blocks.7/self_attn/q_norm/Cast_1_output_0!/blocks.7/self_attn/q_norm/Cast_1"Cast* to  */blocks.7/self_attn/q_norm/Cast_1_output_0 '/blocks.7/self_attn/q_norm/Div_output_0'/blocks.7/self_attn/q_norm/Mul_output_0/blocks.7/self_attn/q_norm/Mul"Mul  '/blocks.7/self_attn/q_norm/Mul_output_0 blocks.7.self_attn.q_norm.weight)/blocks.7/self_attn/q_norm/Mul_1_output_0 /blocks.7/self_attn/q_norm/Mul_1"Mul  )/blocks.7/self_attn/q_norm/Mul_1_output_0*/blocks.7/self_attn/q_norm/Cast_2_output_0!/blocks.7/self_attn/q_norm/Cast_2"Cast* to  &/blocks.7/self_attn/Reshape_1_output_0(/blocks.7/self_attn/k_norm/Cast_output_0/blocks.7/self_attn/k_norm/Cast"Cast* to ,/blocks.7/self_attn/k_norm/Constant_output_0#/blocks.7/self_attn/k_norm/Constant"Constant*E value*9B//blocks.7/self_attn/k_norm/Constant_attr::valueJ@  (/blocks.7/self_attn/k_norm/Cast_output_0 ,/blocks.7/self_attn/k_norm/Constant_output_0'/blocks.7/self_attn/k_norm/Pow_output_0/blocks.7/self_attn/k_norm/Pow"Pow  '/blocks.7/self_attn/k_norm/Pow_output_0./blocks.7/self_attn/k_norm/ReduceMean_output_0%/blocks.7/self_attn/k_norm/ReduceMean" ReduceMean* axes@* keepdims ./blocks.7/self_attn/k_norm/Constant_1_output_0%/blocks.7/self_attn/k_norm/Constant_1"Constant*G value*;B1/blocks.7/self_attn/k_norm/Constant_1_attr::valueJ75  ./blocks.7/self_attn/k_norm/ReduceMean_output_0 ./blocks.7/self_attn/k_norm/Constant_1_output_0'/blocks.7/self_attn/k_norm/Add_output_0/blocks.7/self_attn/k_norm/Add"Add z '/blocks.7/self_attn/k_norm/Add_output_0(/blocks.7/self_attn/k_norm/Sqrt_output_0/blocks.7/self_attn/k_norm/Sqrt"Sqrt ./blocks.7/self_attn/k_norm/Constant_2_output_0%/blocks.7/self_attn/k_norm/Constant_2"Constant*G value*;B1/blocks.7/self_attn/k_norm/Constant_2_attr::valueJ?  ./blocks.7/self_attn/k_norm/Constant_2_output_0 (/blocks.7/self_attn/k_norm/Sqrt_output_0'/blocks.7/self_attn/k_norm/Div_output_0/blocks.7/self_attn/k_norm/Div"Div  (/blocks.7/self_attn/k_norm/Cast_output_0*/blocks.7/self_attn/k_norm/Cast_1_output_0!/blocks.7/self_attn/k_norm/Cast_1"Cast* to  */blocks.7/self_attn/k_norm/Cast_1_output_0 '/blocks.7/self_attn/k_norm/Div_output_0'/blocks.7/self_attn/k_norm/Mul_output_0/blocks.7/self_attn/k_norm/Mul"Mul  '/blocks.7/self_attn/k_norm/Mul_output_0 blocks.7.self_attn.k_norm.weight)/blocks.7/self_attn/k_norm/Mul_1_output_0 /blocks.7/self_attn/k_norm/Mul_1"Mul  )/blocks.7/self_attn/k_norm/Mul_1_output_0*/blocks.7/self_attn/k_norm/Cast_2_output_0!/blocks.7/self_attn/k_norm/Cast_2"Cast* to  */blocks.7/self_attn/q_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0 /blocks.7/self_attn/Mul_output_0/blocks.7/self_attn/Mul"Mul v */blocks.7/self_attn/q_norm/Cast_2_output_0$/blocks.7/self_attn/Shape_2_output_0/blocks.7/self_attn/Shape_2"Shape '/blocks.7/self_attn/Constant_8_output_0/blocks.7/self_attn/Constant_8"Constant*D value*8B*/blocks.7/self_attn/Constant_8_attr::valueJ  $/blocks.7/self_attn/Shape_2_output_0 '/blocks.7/self_attn/Constant_8_output_0%/blocks.7/self_attn/Gather_2_output_0/blocks.7/self_attn/Gather_2"Gather* axis '/blocks.7/self_attn/Constant_9_output_0/blocks.7/self_attn/Constant_9"Constant*D value*8B*/blocks.7/self_attn/Constant_9_attr::valueJ  %/blocks.7/self_attn/Gather_2_output_0 '/blocks.7/self_attn/Constant_9_output_0 /blocks.7/self_attn/Div_output_0/blocks.7/self_attn/Div"Div p /blocks.7/self_attn/Div_output_0!/blocks.7/self_attn/Cast_output_0/blocks.7/self_attn/Cast"Cast* to u !/blocks.7/self_attn/Cast_output_0#/blocks.7/self_attn/Cast_1_output_0/blocks.7/self_attn/Cast_1"Cast* to (/blocks.7/self_attn/Constant_10_output_0/blocks.7/self_attn/Constant_10"Constant*G value*;B+/blocks.7/self_attn/Constant_10_attr::valueJ (/blocks.7/self_attn/Constant_11_output_0/blocks.7/self_attn/Constant_11"Constant*G value*;B+/blocks.7/self_attn/Constant_11_attr::valueJ (/blocks.7/self_attn/Constant_12_output_0/blocks.7/self_attn/Constant_12"Constant*G value*;B+/blocks.7/self_attn/Constant_12_attr::valueJ  #/blocks.7/self_attn/Cast_1_output_0 (/blocks.7/self_attn/Constant_12_output_0(/blocks.7/self_attn/Unsqueeze_6_output_0/blocks.7/self_attn/Unsqueeze_6" Unsqueeze (/blocks.7/self_attn/Constant_13_output_0/blocks.7/self_attn/Constant_13"Constant*G value*;B+/blocks.7/self_attn/Constant_13_attr::valueJ  */blocks.7/self_attn/q_norm/Cast_2_output_0 (/blocks.7/self_attn/Constant_11_output_0 (/blocks.7/self_attn/Unsqueeze_6_output_0 (/blocks.7/self_attn/Constant_10_output_0 (/blocks.7/self_attn/Constant_13_output_0"/blocks.7/self_attn/Slice_output_0/blocks.7/self_attn/Slice"Slice (/blocks.7/self_attn/Constant_14_output_0/blocks.7/self_attn/Constant_14"Constant*G value*;B+/blocks.7/self_attn/Constant_14_attr::valueJ (/blocks.7/self_attn/Constant_15_output_0/blocks.7/self_attn/Constant_15"Constant*G value*;B+/blocks.7/self_attn/Constant_15_attr::valueJ  #/blocks.7/self_attn/Cast_1_output_0 (/blocks.7/self_attn/Constant_15_output_0(/blocks.7/self_attn/Unsqueeze_7_output_0/blocks.7/self_attn/Unsqueeze_7" Unsqueeze (/blocks.7/self_attn/Constant_16_output_0/blocks.7/self_attn/Constant_16"Constant*G value*;B+/blocks.7/self_attn/Constant_16_attr::valueJ (/blocks.7/self_attn/Constant_17_output_0/blocks.7/self_attn/Constant_17"Constant*G value*;B+/blocks.7/self_attn/Constant_17_attr::valueJ  */blocks.7/self_attn/q_norm/Cast_2_output_0 (/blocks.7/self_attn/Unsqueeze_7_output_0 (/blocks.7/self_attn/Constant_16_output_0 (/blocks.7/self_attn/Constant_14_output_0 (/blocks.7/self_attn/Constant_17_output_0$/blocks.7/self_attn/Slice_1_output_0/blocks.7/self_attn/Slice_1"Slice f $/blocks.7/self_attn/Slice_1_output_0 /blocks.7/self_attn/Neg_output_0/blocks.7/self_attn/Neg"Neg  /blocks.7/self_attn/Neg_output_0 "/blocks.7/self_attn/Slice_output_0%/blocks.7/self_attn/Concat_3_output_0/blocks.7/self_attn/Concat_3"Concat* axis  %/blocks.7/self_attn/Concat_3_output_0 %/blocks.0/self_attn/Gather_3_output_0"/blocks.7/self_attn/Mul_1_output_0/blocks.7/self_attn/Mul_1"Mul  /blocks.7/self_attn/Mul_output_0 "/blocks.7/self_attn/Mul_1_output_0 /blocks.7/self_attn/Add_output_0/blocks.7/self_attn/Add"Add  */blocks.7/self_attn/k_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0"/blocks.7/self_attn/Mul_2_output_0/blocks.7/self_attn/Mul_2"Mul v */blocks.7/self_attn/k_norm/Cast_2_output_0$/blocks.7/self_attn/Shape_3_output_0/blocks.7/self_attn/Shape_3"Shape (/blocks.7/self_attn/Constant_18_output_0/blocks.7/self_attn/Constant_18"Constant*E value*9B+/blocks.7/self_attn/Constant_18_attr::valueJ  $/blocks.7/self_attn/Shape_3_output_0 (/blocks.7/self_attn/Constant_18_output_0%/blocks.7/self_attn/Gather_3_output_0/blocks.7/self_attn/Gather_3"Gather* axis (/blocks.7/self_attn/Constant_19_output_0/blocks.7/self_attn/Constant_19"Constant*E value*9B+/blocks.7/self_attn/Constant_19_attr::valueJ  %/blocks.7/self_attn/Gather_3_output_0 (/blocks.7/self_attn/Constant_19_output_0"/blocks.7/self_attn/Div_1_output_0/blocks.7/self_attn/Div_1"Div v "/blocks.7/self_attn/Div_1_output_0#/blocks.7/self_attn/Cast_2_output_0/blocks.7/self_attn/Cast_2"Cast* to w #/blocks.7/self_attn/Cast_2_output_0#/blocks.7/self_attn/Cast_3_output_0/blocks.7/self_attn/Cast_3"Cast* to (/blocks.7/self_attn/Constant_20_output_0/blocks.7/self_attn/Constant_20"Constant*G value*;B+/blocks.7/self_attn/Constant_20_attr::valueJ (/blocks.7/self_attn/Constant_21_output_0/blocks.7/self_attn/Constant_21"Constant*G value*;B+/blocks.7/self_attn/Constant_21_attr::valueJ (/blocks.7/self_attn/Constant_22_output_0/blocks.7/self_attn/Constant_22"Constant*G value*;B+/blocks.7/self_attn/Constant_22_attr::valueJ  #/blocks.7/self_attn/Cast_3_output_0 (/blocks.7/self_attn/Constant_22_output_0(/blocks.7/self_attn/Unsqueeze_8_output_0/blocks.7/self_attn/Unsqueeze_8" Unsqueeze (/blocks.7/self_attn/Constant_23_output_0/blocks.7/self_attn/Constant_23"Constant*G value*;B+/blocks.7/self_attn/Constant_23_attr::valueJ  */blocks.7/self_attn/k_norm/Cast_2_output_0 (/blocks.7/self_attn/Constant_21_output_0 (/blocks.7/self_attn/Unsqueeze_8_output_0 (/blocks.7/self_attn/Constant_20_output_0 (/blocks.7/self_attn/Constant_23_output_0$/blocks.7/self_attn/Slice_2_output_0/blocks.7/self_attn/Slice_2"Slice (/blocks.7/self_attn/Constant_24_output_0/blocks.7/self_attn/Constant_24"Constant*G value*;B+/blocks.7/self_attn/Constant_24_attr::valueJ (/blocks.7/self_attn/Constant_25_output_0/blocks.7/self_attn/Constant_25"Constant*G value*;B+/blocks.7/self_attn/Constant_25_attr::valueJ  #/blocks.7/self_attn/Cast_3_output_0 (/blocks.7/self_attn/Constant_25_output_0(/blocks.7/self_attn/Unsqueeze_9_output_0/blocks.7/self_attn/Unsqueeze_9" Unsqueeze (/blocks.7/self_attn/Constant_26_output_0/blocks.7/self_attn/Constant_26"Constant*G value*;B+/blocks.7/self_attn/Constant_26_attr::valueJ (/blocks.7/self_attn/Constant_27_output_0/blocks.7/self_attn/Constant_27"Constant*G value*;B+/blocks.7/self_attn/Constant_27_attr::valueJ  */blocks.7/self_attn/k_norm/Cast_2_output_0 (/blocks.7/self_attn/Unsqueeze_9_output_0 (/blocks.7/self_attn/Constant_26_output_0 (/blocks.7/self_attn/Constant_24_output_0 (/blocks.7/self_attn/Constant_27_output_0$/blocks.7/self_attn/Slice_3_output_0/blocks.7/self_attn/Slice_3"Slice j $/blocks.7/self_attn/Slice_3_output_0"/blocks.7/self_attn/Neg_1_output_0/blocks.7/self_attn/Neg_1"Neg  "/blocks.7/self_attn/Neg_1_output_0 $/blocks.7/self_attn/Slice_2_output_0%/blocks.7/self_attn/Concat_4_output_0/blocks.7/self_attn/Concat_4"Concat* axis  %/blocks.7/self_attn/Concat_4_output_0 %/blocks.0/self_attn/Gather_3_output_0"/blocks.7/self_attn/Mul_3_output_0/blocks.7/self_attn/Mul_3"Mul  "/blocks.7/self_attn/Mul_2_output_0 "/blocks.7/self_attn/Mul_3_output_0"/blocks.7/self_attn/Add_1_output_0/blocks.7/self_attn/Add_1"Add  /Gather_7_output_0 /rotary/Constant_3_output_0%/blocks.7/self_attn/Gather_4_output_0/blocks.7/self_attn/Gather_4"Gather* axis  /Gather_7_output_0 /rotary/Constant_8_output_0%/blocks.7/self_attn/Gather_5_output_0/blocks.7/self_attn/Gather_5"Gather* axis  %/blocks.7/self_attn/Gather_4_output_0 "/blocks.7/self_attn/Add_1_output_0%/blocks.7/self_attn/Concat_5_output_0/blocks.7/self_attn/Concat_5"Concat* axis  %/blocks.7/self_attn/Gather_5_output_0 &/blocks.7/self_attn/Reshape_2_output_0%/blocks.7/self_attn/Concat_6_output_0/blocks.7/self_attn/Concat_6"Concat* axis (/blocks.7/self_attn/Constant_28_output_0/blocks.7/self_attn/Constant_28"Constant*G value*;B+/blocks.7/self_attn/Constant_28_attr::valueJ  %/blocks.7/self_attn/Concat_5_output_0 (/blocks.7/self_attn/Constant_28_output_0)/blocks.7/self_attn/Unsqueeze_10_output_0 /blocks.7/self_attn/Unsqueeze_10" Unsqueeze (/blocks.7/self_attn/Constant_29_output_0/blocks.7/self_attn/Constant_29"Constant*G value*;B+/blocks.7/self_attn/Constant_29_attr::valueJ  %/blocks.7/self_attn/Concat_6_output_0 (/blocks.7/self_attn/Constant_29_output_0)/blocks.7/self_attn/Unsqueeze_11_output_0 /blocks.7/self_attn/Unsqueeze_11" Unsqueeze  )/blocks.7/self_attn/Unsqueeze_10_output_0 )/blocks.7/self_attn/Unsqueeze_11_output_0%/blocks.7/self_attn/Concat_7_output_0/blocks.7/self_attn/Concat_7"Concat* axis  /blocks.7/self_attn/Add_output_0&/blocks.7/self_attn/Transpose_output_0/blocks.7/self_attn/Transpose" Transpose* perm@@@@  %/blocks.7/self_attn/Concat_5_output_0(/blocks.7/self_attn/Transpose_1_output_0/blocks.7/self_attn/Transpose_1" Transpose* perm@@@@  %/blocks.7/self_attn/Concat_6_output_0(/blocks.7/self_attn/Transpose_2_output_0/blocks.7/self_attn/Transpose_2" Transpose* perm@@@@ t (/blocks.7/self_attn/Transpose_1_output_0$/blocks.7/self_attn/Shape_4_output_0/blocks.7/self_attn/Shape_4"Shape (/blocks.7/self_attn/Constant_30_output_0/blocks.7/self_attn/Constant_30"Constant*E value*9B+/blocks.7/self_attn/Constant_30_attr::valueJ  $/blocks.7/self_attn/Shape_4_output_0 (/blocks.7/self_attn/Constant_30_output_0%/blocks.7/self_attn/Gather_6_output_0/blocks.7/self_attn/Gather_6"Gather* axis t (/blocks.7/self_attn/Transpose_1_output_0$/blocks.7/self_attn/Shape_5_output_0/blocks.7/self_attn/Shape_5"Shape (/blocks.7/self_attn/Constant_31_output_0/blocks.7/self_attn/Constant_31"Constant*E value*9B+/blocks.7/self_attn/Constant_31_attr::valueJ  $/blocks.7/self_attn/Shape_5_output_0 (/blocks.7/self_attn/Constant_31_output_0%/blocks.7/self_attn/Gather_7_output_0/blocks.7/self_attn/Gather_7"Gather* axis t (/blocks.7/self_attn/Transpose_1_output_0$/blocks.7/self_attn/Shape_6_output_0/blocks.7/self_attn/Shape_6"Shape (/blocks.7/self_attn/Constant_32_output_0/blocks.7/self_attn/Constant_32"Constant*E value*9B+/blocks.7/self_attn/Constant_32_attr::valueJ  $/blocks.7/self_attn/Shape_6_output_0 (/blocks.7/self_attn/Constant_32_output_0%/blocks.7/self_attn/Gather_8_output_0/blocks.7/self_attn/Gather_8"Gather* axis t (/blocks.7/self_attn/Transpose_1_output_0$/blocks.7/self_attn/Shape_7_output_0/blocks.7/self_attn/Shape_7"Shape (/blocks.7/self_attn/Constant_33_output_0/blocks.7/self_attn/Constant_33"Constant*E value*9B+/blocks.7/self_attn/Constant_33_attr::valueJ  $/blocks.7/self_attn/Shape_7_output_0 (/blocks.7/self_attn/Constant_33_output_0%/blocks.7/self_attn/Gather_9_output_0/blocks.7/self_attn/Gather_9"Gather* axis (/blocks.7/self_attn/Constant_34_output_0/blocks.7/self_attn/Constant_34"Constant*G value*;B+/blocks.7/self_attn/Constant_34_attr::valueJ  (/blocks.7/self_attn/Transpose_1_output_0 (/blocks.7/self_attn/Constant_34_output_0)/blocks.7/self_attn/Unsqueeze_12_output_0 /blocks.7/self_attn/Unsqueeze_12" Unsqueeze (/blocks.7/self_attn/Constant_35_output_0/blocks.7/self_attn/Constant_35"Constant*G value*;B+/blocks.7/self_attn/Constant_35_attr::valueJ  %/blocks.7/self_attn/Gather_6_output_0 (/blocks.7/self_attn/Constant_35_output_0)/blocks.7/self_attn/Unsqueeze_13_output_0 /blocks.7/self_attn/Unsqueeze_13" Unsqueeze (/blocks.7/self_attn/Constant_36_output_0/blocks.7/self_attn/Constant_36"Constant*G value*;B+/blocks.7/self_attn/Constant_36_attr::valueJ  %/blocks.7/self_attn/Gather_7_output_0 (/blocks.7/self_attn/Constant_36_output_0)/blocks.7/self_attn/Unsqueeze_14_output_0 /blocks.7/self_attn/Unsqueeze_14" Unsqueeze (/blocks.7/self_attn/Constant_37_output_0/blocks.7/self_attn/Constant_37"Constant*G value*;B+/blocks.7/self_attn/Constant_37_attr::valueJ (/blocks.7/self_attn/Constant_38_output_0/blocks.7/self_attn/Constant_38"Constant*G value*;B+/blocks.7/self_attn/Constant_38_attr::valueJ  %/blocks.7/self_attn/Gather_8_output_0 (/blocks.7/self_attn/Constant_38_output_0)/blocks.7/self_attn/Unsqueeze_15_output_0 /blocks.7/self_attn/Unsqueeze_15" Unsqueeze (/blocks.7/self_attn/Constant_39_output_0/blocks.7/self_attn/Constant_39"Constant*G value*;B+/blocks.7/self_attn/Constant_39_attr::valueJ  %/blocks.7/self_attn/Gather_9_output_0 (/blocks.7/self_attn/Constant_39_output_0)/blocks.7/self_attn/Unsqueeze_16_output_0 /blocks.7/self_attn/Unsqueeze_16" Unsqueeze  )/blocks.7/self_attn/Unsqueeze_13_output_0 )/blocks.7/self_attn/Unsqueeze_14_output_0 (/blocks.7/self_attn/Constant_37_output_0 )/blocks.7/self_attn/Unsqueeze_15_output_0 )/blocks.7/self_attn/Unsqueeze_16_output_0%/blocks.7/self_attn/Concat_8_output_0/blocks.7/self_attn/Concat_8"Concat* axis (/blocks.7/self_attn/Constant_40_output_0/blocks.7/self_attn/Constant_40"Constant*G value*;B+/blocks.7/self_attn/Constant_40_attr::valueJ  %/blocks.7/self_attn/Concat_8_output_0 (/blocks.7/self_attn/Constant_40_output_0&/blocks.7/self_attn/Reshape_3_output_0/blocks.7/self_attn/Reshape_3"Reshape* allowzero r &/blocks.7/self_attn/Reshape_3_output_0$/blocks.7/self_attn/Shape_8_output_0/blocks.7/self_attn/Shape_8"Shape  $/blocks.7/self_attn/Shape_8_output_0,/blocks.7/self_attn/ConstantOfShape_output_0#/blocks.7/self_attn/ConstantOfShape"ConstantOfShape*K value*?B//blocks.7/self_attn/ConstantOfShape_attr::valueJ (/blocks.7/self_attn/Constant_41_output_0/blocks.7/self_attn/Constant_41"Constant*E value*9B+/blocks.7/self_attn/Constant_41_attr::valueJ  ,/blocks.7/self_attn/ConstantOfShape_output_0 (/blocks.7/self_attn/Constant_41_output_0"/blocks.7/self_attn/Mul_4_output_0/blocks.7/self_attn/Mul_4"Mul  &/blocks.7/self_attn/Reshape_3_output_0 "/blocks.7/self_attn/Mul_4_output_0"/blocks.7/self_attn/Equal_output_0/blocks.7/self_attn/Equal"Equal  "/blocks.7/self_attn/Equal_output_0 ,/blocks.7/self_attn/ConstantOfShape_output_0 &/blocks.7/self_attn/Reshape_3_output_0"/blocks.7/self_attn/Where_output_0/blocks.7/self_attn/Where"Where  )/blocks.7/self_attn/Unsqueeze_12_output_0 "/blocks.7/self_attn/Where_output_0#/blocks.7/self_attn/Expand_output_0/blocks.7/self_attn/Expand"Expand (/blocks.7/self_attn/Constant_42_output_0/blocks.7/self_attn/Constant_42"Constant*E value*9B+/blocks.7/self_attn/Constant_42_attr::valueJ  %/blocks.7/self_attn/Gather_7_output_0 (/blocks.7/self_attn/Constant_42_output_0"/blocks.7/self_attn/Mul_5_output_0/blocks.7/self_attn/Mul_5"Mul fonnx::Unsqueeze_2570 Constant_4537"Constant*5 value*)BConstant_4537_attr::valueJ  %/blocks.7/self_attn/Gather_6_output_0 onnx::Unsqueeze_2570)/blocks.7/self_attn/Unsqueeze_17_output_0 /blocks.7/self_attn/Unsqueeze_17" Unsqueeze fonnx::Unsqueeze_2572 Constant_4539"Constant*5 value*)BConstant_4539_attr::valueJ  "/blocks.7/self_attn/Mul_5_output_0 onnx::Unsqueeze_2572)/blocks.7/self_attn/Unsqueeze_18_output_0 /blocks.7/self_attn/Unsqueeze_18" Unsqueeze fonnx::Unsqueeze_2574 Constant_4541"Constant*5 value*)BConstant_4541_attr::valueJ  %/blocks.7/self_attn/Gather_8_output_0 onnx::Unsqueeze_2574)/blocks.7/self_attn/Unsqueeze_19_output_0 /blocks.7/self_attn/Unsqueeze_19" Unsqueeze fonnx::Unsqueeze_2576 Constant_4543"Constant*5 value*)BConstant_4543_attr::valueJ  %/blocks.7/self_attn/Gather_9_output_0 onnx::Unsqueeze_2576)/blocks.7/self_attn/Unsqueeze_20_output_0 /blocks.7/self_attn/Unsqueeze_20" Unsqueeze  )/blocks.7/self_attn/Unsqueeze_17_output_0 )/blocks.7/self_attn/Unsqueeze_18_output_0 )/blocks.7/self_attn/Unsqueeze_19_output_0 )/blocks.7/self_attn/Unsqueeze_20_output_0%/blocks.7/self_attn/Concat_9_output_0/blocks.7/self_attn/Concat_9"Concat* axis  #/blocks.7/self_attn/Expand_output_0 %/blocks.7/self_attn/Concat_9_output_0&/blocks.7/self_attn/Reshape_4_output_0/blocks.7/self_attn/Reshape_4"Reshape* allowzero t (/blocks.7/self_attn/Transpose_2_output_0$/blocks.7/self_attn/Shape_9_output_0/blocks.7/self_attn/Shape_9"Shape (/blocks.7/self_attn/Constant_43_output_0/blocks.7/self_attn/Constant_43"Constant*E value*9B+/blocks.7/self_attn/Constant_43_attr::valueJ  $/blocks.7/self_attn/Shape_9_output_0 (/blocks.7/self_attn/Constant_43_output_0&/blocks.7/self_attn/Gather_10_output_0/blocks.7/self_attn/Gather_10"Gather* axis v (/blocks.7/self_attn/Transpose_2_output_0%/blocks.7/self_attn/Shape_10_output_0/blocks.7/self_attn/Shape_10"Shape (/blocks.7/self_attn/Constant_44_output_0/blocks.7/self_attn/Constant_44"Constant*E value*9B+/blocks.7/self_attn/Constant_44_attr::valueJ  %/blocks.7/self_attn/Shape_10_output_0 (/blocks.7/self_attn/Constant_44_output_0&/blocks.7/self_attn/Gather_11_output_0/blocks.7/self_attn/Gather_11"Gather* axis v (/blocks.7/self_attn/Transpose_2_output_0%/blocks.7/self_attn/Shape_11_output_0/blocks.7/self_attn/Shape_11"Shape (/blocks.7/self_attn/Constant_45_output_0/blocks.7/self_attn/Constant_45"Constant*E value*9B+/blocks.7/self_attn/Constant_45_attr::valueJ  %/blocks.7/self_attn/Shape_11_output_0 (/blocks.7/self_attn/Constant_45_output_0&/blocks.7/self_attn/Gather_12_output_0/blocks.7/self_attn/Gather_12"Gather* axis v (/blocks.7/self_attn/Transpose_2_output_0%/blocks.7/self_attn/Shape_12_output_0/blocks.7/self_attn/Shape_12"Shape (/blocks.7/self_attn/Constant_46_output_0/blocks.7/self_attn/Constant_46"Constant*E value*9B+/blocks.7/self_attn/Constant_46_attr::valueJ  %/blocks.7/self_attn/Shape_12_output_0 (/blocks.7/self_attn/Constant_46_output_0&/blocks.7/self_attn/Gather_13_output_0/blocks.7/self_attn/Gather_13"Gather* axis (/blocks.7/self_attn/Constant_47_output_0/blocks.7/self_attn/Constant_47"Constant*G value*;B+/blocks.7/self_attn/Constant_47_attr::valueJ  (/blocks.7/self_attn/Transpose_2_output_0 (/blocks.7/self_attn/Constant_47_output_0)/blocks.7/self_attn/Unsqueeze_21_output_0 /blocks.7/self_attn/Unsqueeze_21" Unsqueeze (/blocks.7/self_attn/Constant_48_output_0/blocks.7/self_attn/Constant_48"Constant*G value*;B+/blocks.7/self_attn/Constant_48_attr::valueJ  &/blocks.7/self_attn/Gather_10_output_0 (/blocks.7/self_attn/Constant_48_output_0)/blocks.7/self_attn/Unsqueeze_22_output_0 /blocks.7/self_attn/Unsqueeze_22" Unsqueeze (/blocks.7/self_attn/Constant_49_output_0/blocks.7/self_attn/Constant_49"Constant*G value*;B+/blocks.7/self_attn/Constant_49_attr::valueJ  &/blocks.7/self_attn/Gather_11_output_0 (/blocks.7/self_attn/Constant_49_output_0)/blocks.7/self_attn/Unsqueeze_23_output_0 /blocks.7/self_attn/Unsqueeze_23" Unsqueeze (/blocks.7/self_attn/Constant_50_output_0/blocks.7/self_attn/Constant_50"Constant*G value*;B+/blocks.7/self_attn/Constant_50_attr::valueJ (/blocks.7/self_attn/Constant_51_output_0/blocks.7/self_attn/Constant_51"Constant*G value*;B+/blocks.7/self_attn/Constant_51_attr::valueJ  &/blocks.7/self_attn/Gather_12_output_0 (/blocks.7/self_attn/Constant_51_output_0)/blocks.7/self_attn/Unsqueeze_24_output_0 /blocks.7/self_attn/Unsqueeze_24" Unsqueeze (/blocks.7/self_attn/Constant_52_output_0/blocks.7/self_attn/Constant_52"Constant*G value*;B+/blocks.7/self_attn/Constant_52_attr::valueJ  &/blocks.7/self_attn/Gather_13_output_0 (/blocks.7/self_attn/Constant_52_output_0)/blocks.7/self_attn/Unsqueeze_25_output_0 /blocks.7/self_attn/Unsqueeze_25" Unsqueeze  )/blocks.7/self_attn/Unsqueeze_22_output_0 )/blocks.7/self_attn/Unsqueeze_23_output_0 (/blocks.7/self_attn/Constant_50_output_0 )/blocks.7/self_attn/Unsqueeze_24_output_0 )/blocks.7/self_attn/Unsqueeze_25_output_0&/blocks.7/self_attn/Concat_10_output_0/blocks.7/self_attn/Concat_10"Concat* axis (/blocks.7/self_attn/Constant_53_output_0/blocks.7/self_attn/Constant_53"Constant*G value*;B+/blocks.7/self_attn/Constant_53_attr::valueJ  &/blocks.7/self_attn/Concat_10_output_0 (/blocks.7/self_attn/Constant_53_output_0&/blocks.7/self_attn/Reshape_5_output_0/blocks.7/self_attn/Reshape_5"Reshape* allowzero t &/blocks.7/self_attn/Reshape_5_output_0%/blocks.7/self_attn/Shape_13_output_0/blocks.7/self_attn/Shape_13"Shape  %/blocks.7/self_attn/Shape_13_output_0./blocks.7/self_attn/ConstantOfShape_1_output_0%/blocks.7/self_attn/ConstantOfShape_1"ConstantOfShape*M value*AB1/blocks.7/self_attn/ConstantOfShape_1_attr::valueJ (/blocks.7/self_attn/Constant_54_output_0/blocks.7/self_attn/Constant_54"Constant*E value*9B+/blocks.7/self_attn/Constant_54_attr::valueJ  ./blocks.7/self_attn/ConstantOfShape_1_output_0 (/blocks.7/self_attn/Constant_54_output_0"/blocks.7/self_attn/Mul_6_output_0/blocks.7/self_attn/Mul_6"Mul  &/blocks.7/self_attn/Reshape_5_output_0 "/blocks.7/self_attn/Mul_6_output_0$/blocks.7/self_attn/Equal_1_output_0/blocks.7/self_attn/Equal_1"Equal  $/blocks.7/self_attn/Equal_1_output_0 ./blocks.7/self_attn/ConstantOfShape_1_output_0 &/blocks.7/self_attn/Reshape_5_output_0$/blocks.7/self_attn/Where_1_output_0/blocks.7/self_attn/Where_1"Where  )/blocks.7/self_attn/Unsqueeze_21_output_0 $/blocks.7/self_attn/Where_1_output_0%/blocks.7/self_attn/Expand_1_output_0/blocks.7/self_attn/Expand_1"Expand (/blocks.7/self_attn/Constant_55_output_0/blocks.7/self_attn/Constant_55"Constant*E value*9B+/blocks.7/self_attn/Constant_55_attr::valueJ  &/blocks.7/self_attn/Gather_11_output_0 (/blocks.7/self_attn/Constant_55_output_0"/blocks.7/self_attn/Mul_7_output_0/blocks.7/self_attn/Mul_7"Mul fonnx::Unsqueeze_2616 Constant_4582"Constant*5 value*)BConstant_4582_attr::valueJ  &/blocks.7/self_attn/Gather_10_output_0 onnx::Unsqueeze_2616)/blocks.7/self_attn/Unsqueeze_26_output_0 /blocks.7/self_attn/Unsqueeze_26" Unsqueeze fonnx::Unsqueeze_2618 Constant_4584"Constant*5 value*)BConstant_4584_attr::valueJ  "/blocks.7/self_attn/Mul_7_output_0 onnx::Unsqueeze_2618)/blocks.7/self_attn/Unsqueeze_27_output_0 /blocks.7/self_attn/Unsqueeze_27" Unsqueeze fonnx::Unsqueeze_2620 Constant_4586"Constant*5 value*)BConstant_4586_attr::valueJ  &/blocks.7/self_attn/Gather_12_output_0 onnx::Unsqueeze_2620)/blocks.7/self_attn/Unsqueeze_28_output_0 /blocks.7/self_attn/Unsqueeze_28" Unsqueeze fonnx::Unsqueeze_2622 Constant_4588"Constant*5 value*)BConstant_4588_attr::valueJ  &/blocks.7/self_attn/Gather_13_output_0 onnx::Unsqueeze_2622)/blocks.7/self_attn/Unsqueeze_29_output_0 /blocks.7/self_attn/Unsqueeze_29" Unsqueeze  )/blocks.7/self_attn/Unsqueeze_26_output_0 )/blocks.7/self_attn/Unsqueeze_27_output_0 )/blocks.7/self_attn/Unsqueeze_28_output_0 )/blocks.7/self_attn/Unsqueeze_29_output_0&/blocks.7/self_attn/Concat_11_output_0/blocks.7/self_attn/Concat_11"Concat* axis  %/blocks.7/self_attn/Expand_1_output_0 &/blocks.7/self_attn/Concat_11_output_0&/blocks.7/self_attn/Reshape_6_output_0/blocks.7/self_attn/Reshape_6"Reshape* allowzero  &/blocks.7/self_attn/Transpose_output_0 &/blocks.7/self_attn/Reshape_4_output_0#/blocks.7/self_attn/MatMul_output_0/blocks.7/self_attn/MatMul"MatMul (/blocks.7/self_attn/Constant_56_output_0/blocks.7/self_attn/Constant_56"Constant*A value*5B+/blocks.7/self_attn/Constant_56_attr::valueJ5A  #/blocks.7/self_attn/MatMul_output_0 (/blocks.7/self_attn/Constant_56_output_0"/blocks.7/self_attn/Div_2_output_0/blocks.7/self_attn/Div_2"Div x "/blocks.7/self_attn/Div_2_output_0 attention_mask"/blocks.7/self_attn/Add_2_output_0/blocks.7/self_attn/Add_2"Add  "/blocks.7/self_attn/Add_2_output_0$/blocks.7/self_attn/Softmax_output_0/blocks.7/self_attn/Softmax"Softmax* axis x $/blocks.7/self_attn/Softmax_output_0#/blocks.7/self_attn/Cast_4_output_0/blocks.7/self_attn/Cast_4"Cast* to  #/blocks.7/self_attn/Cast_4_output_0 &/blocks.7/self_attn/Reshape_6_output_0%/blocks.7/self_attn/MatMul_1_output_0/blocks.7/self_attn/MatMul_1"MatMul  %/blocks.7/self_attn/MatMul_1_output_0(/blocks.7/self_attn/Transpose_3_output_0/blocks.7/self_attn/Transpose_3" Transpose* perm@@@@ fonnx::Unsqueeze_2634 Constant_4600"Constant*5 value*)BConstant_4600_attr::valueJ  #/blocks.7/self_attn/Gather_output_0 onnx::Unsqueeze_2634)/blocks.7/self_attn/Unsqueeze_30_output_0 /blocks.7/self_attn/Unsqueeze_30" Unsqueeze fonnx::Unsqueeze_2636 Constant_4602"Constant*5 value*)BConstant_4602_attr::valueJ  %/blocks.7/self_attn/Gather_1_output_0 onnx::Unsqueeze_2636)/blocks.7/self_attn/Unsqueeze_31_output_0 /blocks.7/self_attn/Unsqueeze_31" Unsqueeze (/blocks.7/self_attn/Constant_57_output_0/blocks.7/self_attn/Constant_57"Constant*G value*;B+/blocks.7/self_attn/Constant_57_attr::valueJ  )/blocks.7/self_attn/Unsqueeze_30_output_0 )/blocks.7/self_attn/Unsqueeze_31_output_0 (/blocks.7/self_attn/Constant_57_output_0&/blocks.7/self_attn/Concat_12_output_0/blocks.7/self_attn/Concat_12"Concat* axis  (/blocks.7/self_attn/Transpose_3_output_0 &/blocks.7/self_attn/Concat_12_output_0&/blocks.7/self_attn/Reshape_7_output_0/blocks.7/self_attn/Reshape_7"Reshape* allowzero  &/blocks.7/self_attn/Reshape_7_output_0 onnx::MatMul_8785*/blocks.7/self_attn/o_proj/MatMul_output_0!/blocks.7/self_attn/o_proj/MatMul"MatMul  )/blocks.7/input_layernorm/Cast_1_output_0 */blocks.7/self_attn/o_proj/MatMul_output_0/blocks.7/Add_output_0 /blocks.7/Add"Add  /blocks.7/Add_output_00/blocks.7/post_attention_layernorm/Cast_output_0'/blocks.7/post_attention_layernorm/Cast"Cast* to 4/blocks.7/post_attention_layernorm/Constant_output_0+/blocks.7/post_attention_layernorm/Constant"Constant*M value*AB7/blocks.7/post_attention_layernorm/Constant_attr::valueJ@  0/blocks.7/post_attention_layernorm/Cast_output_0 4/blocks.7/post_attention_layernorm/Constant_output_0//blocks.7/post_attention_layernorm/Pow_output_0&/blocks.7/post_attention_layernorm/Pow"Pow  //blocks.7/post_attention_layernorm/Pow_output_06/blocks.7/post_attention_layernorm/ReduceMean_output_0-/blocks.7/post_attention_layernorm/ReduceMean" ReduceMean* axes@* keepdims 6/blocks.7/post_attention_layernorm/Constant_1_output_0-/blocks.7/post_attention_layernorm/Constant_1"Constant*O value*CB9/blocks.7/post_attention_layernorm/Constant_1_attr::valueJ75  6/blocks.7/post_attention_layernorm/ReduceMean_output_0 6/blocks.7/post_attention_layernorm/Constant_1_output_0//blocks.7/post_attention_layernorm/Add_output_0&/blocks.7/post_attention_layernorm/Add"Add  //blocks.7/post_attention_layernorm/Add_output_00/blocks.7/post_attention_layernorm/Sqrt_output_0'/blocks.7/post_attention_layernorm/Sqrt"Sqrt 6/blocks.7/post_attention_layernorm/Constant_2_output_0-/blocks.7/post_attention_layernorm/Constant_2"Constant*O value*CB9/blocks.7/post_attention_layernorm/Constant_2_attr::valueJ?  6/blocks.7/post_attention_layernorm/Constant_2_output_0 0/blocks.7/post_attention_layernorm/Sqrt_output_0//blocks.7/post_attention_layernorm/Div_output_0&/blocks.7/post_attention_layernorm/Div"Div  0/blocks.7/post_attention_layernorm/Cast_output_02/blocks.7/post_attention_layernorm/Cast_1_output_0)/blocks.7/post_attention_layernorm/Cast_1"Cast* to  2/blocks.7/post_attention_layernorm/Cast_1_output_0 //blocks.7/post_attention_layernorm/Div_output_0//blocks.7/post_attention_layernorm/Mul_output_0&/blocks.7/post_attention_layernorm/Mul"Mul  //blocks.7/post_attention_layernorm/Mul_output_0 (blocks.7.post_attention_layernorm.weight1/blocks.7/post_attention_layernorm/Mul_1_output_0(/blocks.7/post_attention_layernorm/Mul_1"Mul  1/blocks.7/post_attention_layernorm/Mul_1_output_02/blocks.7/post_attention_layernorm/Cast_2_output_0)/blocks.7/post_attention_layernorm/Cast_2"Cast* to  2/blocks.7/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_8786'/blocks.7/mlp/gate_proj/MatMul_output_0/blocks.7/mlp/gate_proj/MatMul"MatMul w '/blocks.7/mlp/gate_proj/MatMul_output_0%/blocks.7/mlp/act_fn/Sigmoid_output_0/blocks.7/mlp/act_fn/Sigmoid"Sigmoid  '/blocks.7/mlp/gate_proj/MatMul_output_0 %/blocks.7/mlp/act_fn/Sigmoid_output_0!/blocks.7/mlp/act_fn/Mul_output_0/blocks.7/mlp/act_fn/Mul"Mul  2/blocks.7/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_8787%/blocks.7/mlp/up_proj/MatMul_output_0/blocks.7/mlp/up_proj/MatMul"MatMul ~ !/blocks.7/mlp/act_fn/Mul_output_0 %/blocks.7/mlp/up_proj/MatMul_output_0/blocks.7/mlp/Mul_output_0/blocks.7/mlp/Mul"Mul  /blocks.7/mlp/Mul_output_0 onnx::MatMul_8788'/blocks.7/mlp/down_proj/MatMul_output_0/blocks.7/mlp/down_proj/MatMul"MatMul  2/blocks.7/post_attention_layernorm/Cast_1_output_0 '/blocks.7/mlp/down_proj/MatMul_output_0/blocks.7/Add_1_output_0/blocks.7/Add_1"Add n past_key_values '/blocks.0/self_attn/Constant_5_output_0/Gather_8_output_0 /Gather_8"Gather* axis /blocks.8/Constant_output_0/blocks.8/Constant"Constant*J value*>B/blocks.8/Constant_attr::valueJ  /blocks.7/Add_1_output_0 /blocks.8/Constant_output_0/blocks.8/Reshape_output_0/blocks.8/Reshape"Reshape* allowzero v /blocks.8/Reshape_output_0'/blocks.8/input_layernorm/Cast_output_0/blocks.8/input_layernorm/Cast"Cast* to +/blocks.8/input_layernorm/Constant_output_0"/blocks.8/input_layernorm/Constant"Constant*D value*8B./blocks.8/input_layernorm/Constant_attr::valueJ@  '/blocks.8/input_layernorm/Cast_output_0 +/blocks.8/input_layernorm/Constant_output_0&/blocks.8/input_layernorm/Pow_output_0/blocks.8/input_layernorm/Pow"Pow  &/blocks.8/input_layernorm/Pow_output_0-/blocks.8/input_layernorm/ReduceMean_output_0$/blocks.8/input_layernorm/ReduceMean" ReduceMean* axes@* keepdims -/blocks.8/input_layernorm/Constant_1_output_0$/blocks.8/input_layernorm/Constant_1"Constant*F value*:B0/blocks.8/input_layernorm/Constant_1_attr::valueJ75  -/blocks.8/input_layernorm/ReduceMean_output_0 -/blocks.8/input_layernorm/Constant_1_output_0&/blocks.8/input_layernorm/Add_output_0/blocks.8/input_layernorm/Add"Add w &/blocks.8/input_layernorm/Add_output_0'/blocks.8/input_layernorm/Sqrt_output_0/blocks.8/input_layernorm/Sqrt"Sqrt -/blocks.8/input_layernorm/Constant_2_output_0$/blocks.8/input_layernorm/Constant_2"Constant*F value*:B0/blocks.8/input_layernorm/Constant_2_attr::valueJ?  -/blocks.8/input_layernorm/Constant_2_output_0 '/blocks.8/input_layernorm/Sqrt_output_0&/blocks.8/input_layernorm/Div_output_0/blocks.8/input_layernorm/Div"Div  '/blocks.8/input_layernorm/Cast_output_0)/blocks.8/input_layernorm/Cast_1_output_0 /blocks.8/input_layernorm/Cast_1"Cast* to  )/blocks.8/input_layernorm/Cast_1_output_0 &/blocks.8/input_layernorm/Div_output_0&/blocks.8/input_layernorm/Mul_output_0/blocks.8/input_layernorm/Mul"Mul  &/blocks.8/input_layernorm/Mul_output_0 blocks.8.input_layernorm.weight(/blocks.8/input_layernorm/Mul_1_output_0/blocks.8/input_layernorm/Mul_1"Mul  (/blocks.8/input_layernorm/Mul_1_output_0)/blocks.8/input_layernorm/Cast_2_output_0 /blocks.8/input_layernorm/Cast_2"Cast* to q )/blocks.8/input_layernorm/Cast_2_output_0"/blocks.8/self_attn/Shape_output_0/blocks.8/self_attn/Shape"Shape %/blocks.8/self_attn/Constant_output_0/blocks.8/self_attn/Constant"Constant*B value*6B(/blocks.8/self_attn/Constant_attr::valueJ  "/blocks.8/self_attn/Shape_output_0 %/blocks.8/self_attn/Constant_output_0#/blocks.8/self_attn/Gather_output_0/blocks.8/self_attn/Gather"Gather* axis u )/blocks.8/input_layernorm/Cast_2_output_0$/blocks.8/self_attn/Shape_1_output_0/blocks.8/self_attn/Shape_1"Shape '/blocks.8/self_attn/Constant_1_output_0/blocks.8/self_attn/Constant_1"Constant*D value*8B*/blocks.8/self_attn/Constant_1_attr::valueJ  $/blocks.8/self_attn/Shape_1_output_0 '/blocks.8/self_attn/Constant_1_output_0%/blocks.8/self_attn/Gather_1_output_0/blocks.8/self_attn/Gather_1"Gather* axis  )/blocks.8/input_layernorm/Cast_2_output_0 onnx::MatMul_8789*/blocks.8/self_attn/q_proj/MatMul_output_0!/blocks.8/self_attn/q_proj/MatMul"MatMul  )/blocks.8/input_layernorm/Cast_2_output_0 onnx::MatMul_8790*/blocks.8/self_attn/k_proj/MatMul_output_0!/blocks.8/self_attn/k_proj/MatMul"MatMul  )/blocks.8/input_layernorm/Cast_2_output_0 onnx::MatMul_8791*/blocks.8/self_attn/v_proj/MatMul_output_0!/blocks.8/self_attn/v_proj/MatMul"MatMul fonnx::Unsqueeze_2696 Constant_4654"Constant*5 value*)BConstant_4654_attr::valueJ  #/blocks.8/self_attn/Gather_output_0 onnx::Unsqueeze_2696&/blocks.8/self_attn/Unsqueeze_output_0/blocks.8/self_attn/Unsqueeze" Unsqueeze fonnx::Unsqueeze_2698 Constant_4656"Constant*5 value*)BConstant_4656_attr::valueJ  %/blocks.8/self_attn/Gather_1_output_0 onnx::Unsqueeze_2698(/blocks.8/self_attn/Unsqueeze_1_output_0/blocks.8/self_attn/Unsqueeze_1" Unsqueeze '/blocks.8/self_attn/Constant_2_output_0/blocks.8/self_attn/Constant_2"Constant*F value*:B*/blocks.8/self_attn/Constant_2_attr::valueJ '/blocks.8/self_attn/Constant_3_output_0/blocks.8/self_attn/Constant_3"Constant*F value*:B*/blocks.8/self_attn/Constant_3_attr::valueJ  &/blocks.8/self_attn/Unsqueeze_output_0 (/blocks.8/self_attn/Unsqueeze_1_output_0 '/blocks.8/self_attn/Constant_2_output_0 '/blocks.8/self_attn/Constant_3_output_0#/blocks.8/self_attn/Concat_output_0/blocks.8/self_attn/Concat"Concat* axis  */blocks.8/self_attn/q_proj/MatMul_output_0 #/blocks.8/self_attn/Concat_output_0$/blocks.8/self_attn/Reshape_output_0/blocks.8/self_attn/Reshape"Reshape* allowzero fonnx::Unsqueeze_2706 Constant_4662"Constant*5 value*)BConstant_4662_attr::valueJ  #/blocks.8/self_attn/Gather_output_0 onnx::Unsqueeze_2706(/blocks.8/self_attn/Unsqueeze_2_output_0/blocks.8/self_attn/Unsqueeze_2" Unsqueeze fonnx::Unsqueeze_2708 Constant_4664"Constant*5 value*)BConstant_4664_attr::valueJ  %/blocks.8/self_attn/Gather_1_output_0 onnx::Unsqueeze_2708(/blocks.8/self_attn/Unsqueeze_3_output_0/blocks.8/self_attn/Unsqueeze_3" Unsqueeze '/blocks.8/self_attn/Constant_4_output_0/blocks.8/self_attn/Constant_4"Constant*F value*:B*/blocks.8/self_attn/Constant_4_attr::valueJ '/blocks.8/self_attn/Constant_5_output_0/blocks.8/self_attn/Constant_5"Constant*F value*:B*/blocks.8/self_attn/Constant_5_attr::valueJ  (/blocks.8/self_attn/Unsqueeze_2_output_0 (/blocks.8/self_attn/Unsqueeze_3_output_0 '/blocks.8/self_attn/Constant_4_output_0 '/blocks.8/self_attn/Constant_5_output_0%/blocks.8/self_attn/Concat_1_output_0/blocks.8/self_attn/Concat_1"Concat* axis fonnx::Unsqueeze_2715 Constant_4669"Constant*5 value*)BConstant_4669_attr::valueJ  #/blocks.8/self_attn/Gather_output_0 onnx::Unsqueeze_2715(/blocks.8/self_attn/Unsqueeze_4_output_0/blocks.8/self_attn/Unsqueeze_4" Unsqueeze fonnx::Unsqueeze_2717 Constant_4671"Constant*5 value*)BConstant_4671_attr::valueJ  %/blocks.8/self_attn/Gather_1_output_0 onnx::Unsqueeze_2717(/blocks.8/self_attn/Unsqueeze_5_output_0/blocks.8/self_attn/Unsqueeze_5" Unsqueeze '/blocks.8/self_attn/Constant_6_output_0/blocks.8/self_attn/Constant_6"Constant*F value*:B*/blocks.8/self_attn/Constant_6_attr::valueJ '/blocks.8/self_attn/Constant_7_output_0/blocks.8/self_attn/Constant_7"Constant*F value*:B*/blocks.8/self_attn/Constant_7_attr::valueJ  (/blocks.8/self_attn/Unsqueeze_4_output_0 (/blocks.8/self_attn/Unsqueeze_5_output_0 '/blocks.8/self_attn/Constant_6_output_0 '/blocks.8/self_attn/Constant_7_output_0%/blocks.8/self_attn/Concat_2_output_0/blocks.8/self_attn/Concat_2"Concat* axis  */blocks.8/self_attn/k_proj/MatMul_output_0 %/blocks.8/self_attn/Concat_1_output_0&/blocks.8/self_attn/Reshape_1_output_0/blocks.8/self_attn/Reshape_1"Reshape* allowzero  */blocks.8/self_attn/v_proj/MatMul_output_0 %/blocks.8/self_attn/Concat_2_output_0&/blocks.8/self_attn/Reshape_2_output_0/blocks.8/self_attn/Reshape_2"Reshape* allowzero  $/blocks.8/self_attn/Reshape_output_0(/blocks.8/self_attn/q_norm/Cast_output_0/blocks.8/self_attn/q_norm/Cast"Cast* to ,/blocks.8/self_attn/q_norm/Constant_output_0#/blocks.8/self_attn/q_norm/Constant"Constant*E value*9B//blocks.8/self_attn/q_norm/Constant_attr::valueJ@  (/blocks.8/self_attn/q_norm/Cast_output_0 ,/blocks.8/self_attn/q_norm/Constant_output_0'/blocks.8/self_attn/q_norm/Pow_output_0/blocks.8/self_attn/q_norm/Pow"Pow  '/blocks.8/self_attn/q_norm/Pow_output_0./blocks.8/self_attn/q_norm/ReduceMean_output_0%/blocks.8/self_attn/q_norm/ReduceMean" ReduceMean* axes@* keepdims ./blocks.8/self_attn/q_norm/Constant_1_output_0%/blocks.8/self_attn/q_norm/Constant_1"Constant*G value*;B1/blocks.8/self_attn/q_norm/Constant_1_attr::valueJ75  ./blocks.8/self_attn/q_norm/ReduceMean_output_0 ./blocks.8/self_attn/q_norm/Constant_1_output_0'/blocks.8/self_attn/q_norm/Add_output_0/blocks.8/self_attn/q_norm/Add"Add z '/blocks.8/self_attn/q_norm/Add_output_0(/blocks.8/self_attn/q_norm/Sqrt_output_0/blocks.8/self_attn/q_norm/Sqrt"Sqrt ./blocks.8/self_attn/q_norm/Constant_2_output_0%/blocks.8/self_attn/q_norm/Constant_2"Constant*G value*;B1/blocks.8/self_attn/q_norm/Constant_2_attr::valueJ?  ./blocks.8/self_attn/q_norm/Constant_2_output_0 (/blocks.8/self_attn/q_norm/Sqrt_output_0'/blocks.8/self_attn/q_norm/Div_output_0/blocks.8/self_attn/q_norm/Div"Div  (/blocks.8/self_attn/q_norm/Cast_output_0*/blocks.8/self_attn/q_norm/Cast_1_output_0!/blocks.8/self_attn/q_norm/Cast_1"Cast* to  */blocks.8/self_attn/q_norm/Cast_1_output_0 '/blocks.8/self_attn/q_norm/Div_output_0'/blocks.8/self_attn/q_norm/Mul_output_0/blocks.8/self_attn/q_norm/Mul"Mul  '/blocks.8/self_attn/q_norm/Mul_output_0 blocks.8.self_attn.q_norm.weight)/blocks.8/self_attn/q_norm/Mul_1_output_0 /blocks.8/self_attn/q_norm/Mul_1"Mul  )/blocks.8/self_attn/q_norm/Mul_1_output_0*/blocks.8/self_attn/q_norm/Cast_2_output_0!/blocks.8/self_attn/q_norm/Cast_2"Cast* to  &/blocks.8/self_attn/Reshape_1_output_0(/blocks.8/self_attn/k_norm/Cast_output_0/blocks.8/self_attn/k_norm/Cast"Cast* to ,/blocks.8/self_attn/k_norm/Constant_output_0#/blocks.8/self_attn/k_norm/Constant"Constant*E value*9B//blocks.8/self_attn/k_norm/Constant_attr::valueJ@  (/blocks.8/self_attn/k_norm/Cast_output_0 ,/blocks.8/self_attn/k_norm/Constant_output_0'/blocks.8/self_attn/k_norm/Pow_output_0/blocks.8/self_attn/k_norm/Pow"Pow  '/blocks.8/self_attn/k_norm/Pow_output_0./blocks.8/self_attn/k_norm/ReduceMean_output_0%/blocks.8/self_attn/k_norm/ReduceMean" ReduceMean* axes@* keepdims ./blocks.8/self_attn/k_norm/Constant_1_output_0%/blocks.8/self_attn/k_norm/Constant_1"Constant*G value*;B1/blocks.8/self_attn/k_norm/Constant_1_attr::valueJ75  ./blocks.8/self_attn/k_norm/ReduceMean_output_0 ./blocks.8/self_attn/k_norm/Constant_1_output_0'/blocks.8/self_attn/k_norm/Add_output_0/blocks.8/self_attn/k_norm/Add"Add z '/blocks.8/self_attn/k_norm/Add_output_0(/blocks.8/self_attn/k_norm/Sqrt_output_0/blocks.8/self_attn/k_norm/Sqrt"Sqrt ./blocks.8/self_attn/k_norm/Constant_2_output_0%/blocks.8/self_attn/k_norm/Constant_2"Constant*G value*;B1/blocks.8/self_attn/k_norm/Constant_2_attr::valueJ?  ./blocks.8/self_attn/k_norm/Constant_2_output_0 (/blocks.8/self_attn/k_norm/Sqrt_output_0'/blocks.8/self_attn/k_norm/Div_output_0/blocks.8/self_attn/k_norm/Div"Div  (/blocks.8/self_attn/k_norm/Cast_output_0*/blocks.8/self_attn/k_norm/Cast_1_output_0!/blocks.8/self_attn/k_norm/Cast_1"Cast* to  */blocks.8/self_attn/k_norm/Cast_1_output_0 '/blocks.8/self_attn/k_norm/Div_output_0'/blocks.8/self_attn/k_norm/Mul_output_0/blocks.8/self_attn/k_norm/Mul"Mul  '/blocks.8/self_attn/k_norm/Mul_output_0 blocks.8.self_attn.k_norm.weight)/blocks.8/self_attn/k_norm/Mul_1_output_0 /blocks.8/self_attn/k_norm/Mul_1"Mul  )/blocks.8/self_attn/k_norm/Mul_1_output_0*/blocks.8/self_attn/k_norm/Cast_2_output_0!/blocks.8/self_attn/k_norm/Cast_2"Cast* to  */blocks.8/self_attn/q_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0 /blocks.8/self_attn/Mul_output_0/blocks.8/self_attn/Mul"Mul v */blocks.8/self_attn/q_norm/Cast_2_output_0$/blocks.8/self_attn/Shape_2_output_0/blocks.8/self_attn/Shape_2"Shape '/blocks.8/self_attn/Constant_8_output_0/blocks.8/self_attn/Constant_8"Constant*D value*8B*/blocks.8/self_attn/Constant_8_attr::valueJ  $/blocks.8/self_attn/Shape_2_output_0 '/blocks.8/self_attn/Constant_8_output_0%/blocks.8/self_attn/Gather_2_output_0/blocks.8/self_attn/Gather_2"Gather* axis '/blocks.8/self_attn/Constant_9_output_0/blocks.8/self_attn/Constant_9"Constant*D value*8B*/blocks.8/self_attn/Constant_9_attr::valueJ  %/blocks.8/self_attn/Gather_2_output_0 '/blocks.8/self_attn/Constant_9_output_0 /blocks.8/self_attn/Div_output_0/blocks.8/self_attn/Div"Div p /blocks.8/self_attn/Div_output_0!/blocks.8/self_attn/Cast_output_0/blocks.8/self_attn/Cast"Cast* to u !/blocks.8/self_attn/Cast_output_0#/blocks.8/self_attn/Cast_1_output_0/blocks.8/self_attn/Cast_1"Cast* to (/blocks.8/self_attn/Constant_10_output_0/blocks.8/self_attn/Constant_10"Constant*G value*;B+/blocks.8/self_attn/Constant_10_attr::valueJ (/blocks.8/self_attn/Constant_11_output_0/blocks.8/self_attn/Constant_11"Constant*G value*;B+/blocks.8/self_attn/Constant_11_attr::valueJ (/blocks.8/self_attn/Constant_12_output_0/blocks.8/self_attn/Constant_12"Constant*G value*;B+/blocks.8/self_attn/Constant_12_attr::valueJ  #/blocks.8/self_attn/Cast_1_output_0 (/blocks.8/self_attn/Constant_12_output_0(/blocks.8/self_attn/Unsqueeze_6_output_0/blocks.8/self_attn/Unsqueeze_6" Unsqueeze (/blocks.8/self_attn/Constant_13_output_0/blocks.8/self_attn/Constant_13"Constant*G value*;B+/blocks.8/self_attn/Constant_13_attr::valueJ  */blocks.8/self_attn/q_norm/Cast_2_output_0 (/blocks.8/self_attn/Constant_11_output_0 (/blocks.8/self_attn/Unsqueeze_6_output_0 (/blocks.8/self_attn/Constant_10_output_0 (/blocks.8/self_attn/Constant_13_output_0"/blocks.8/self_attn/Slice_output_0/blocks.8/self_attn/Slice"Slice (/blocks.8/self_attn/Constant_14_output_0/blocks.8/self_attn/Constant_14"Constant*G value*;B+/blocks.8/self_attn/Constant_14_attr::valueJ (/blocks.8/self_attn/Constant_15_output_0/blocks.8/self_attn/Constant_15"Constant*G value*;B+/blocks.8/self_attn/Constant_15_attr::valueJ  #/blocks.8/self_attn/Cast_1_output_0 (/blocks.8/self_attn/Constant_15_output_0(/blocks.8/self_attn/Unsqueeze_7_output_0/blocks.8/self_attn/Unsqueeze_7" Unsqueeze (/blocks.8/self_attn/Constant_16_output_0/blocks.8/self_attn/Constant_16"Constant*G value*;B+/blocks.8/self_attn/Constant_16_attr::valueJ (/blocks.8/self_attn/Constant_17_output_0/blocks.8/self_attn/Constant_17"Constant*G value*;B+/blocks.8/self_attn/Constant_17_attr::valueJ  */blocks.8/self_attn/q_norm/Cast_2_output_0 (/blocks.8/self_attn/Unsqueeze_7_output_0 (/blocks.8/self_attn/Constant_16_output_0 (/blocks.8/self_attn/Constant_14_output_0 (/blocks.8/self_attn/Constant_17_output_0$/blocks.8/self_attn/Slice_1_output_0/blocks.8/self_attn/Slice_1"Slice f $/blocks.8/self_attn/Slice_1_output_0 /blocks.8/self_attn/Neg_output_0/blocks.8/self_attn/Neg"Neg  /blocks.8/self_attn/Neg_output_0 "/blocks.8/self_attn/Slice_output_0%/blocks.8/self_attn/Concat_3_output_0/blocks.8/self_attn/Concat_3"Concat* axis  %/blocks.8/self_attn/Concat_3_output_0 %/blocks.0/self_attn/Gather_3_output_0"/blocks.8/self_attn/Mul_1_output_0/blocks.8/self_attn/Mul_1"Mul  /blocks.8/self_attn/Mul_output_0 "/blocks.8/self_attn/Mul_1_output_0 /blocks.8/self_attn/Add_output_0/blocks.8/self_attn/Add"Add  */blocks.8/self_attn/k_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0"/blocks.8/self_attn/Mul_2_output_0/blocks.8/self_attn/Mul_2"Mul v */blocks.8/self_attn/k_norm/Cast_2_output_0$/blocks.8/self_attn/Shape_3_output_0/blocks.8/self_attn/Shape_3"Shape (/blocks.8/self_attn/Constant_18_output_0/blocks.8/self_attn/Constant_18"Constant*E value*9B+/blocks.8/self_attn/Constant_18_attr::valueJ  $/blocks.8/self_attn/Shape_3_output_0 (/blocks.8/self_attn/Constant_18_output_0%/blocks.8/self_attn/Gather_3_output_0/blocks.8/self_attn/Gather_3"Gather* axis (/blocks.8/self_attn/Constant_19_output_0/blocks.8/self_attn/Constant_19"Constant*E value*9B+/blocks.8/self_attn/Constant_19_attr::valueJ  %/blocks.8/self_attn/Gather_3_output_0 (/blocks.8/self_attn/Constant_19_output_0"/blocks.8/self_attn/Div_1_output_0/blocks.8/self_attn/Div_1"Div v "/blocks.8/self_attn/Div_1_output_0#/blocks.8/self_attn/Cast_2_output_0/blocks.8/self_attn/Cast_2"Cast* to w #/blocks.8/self_attn/Cast_2_output_0#/blocks.8/self_attn/Cast_3_output_0/blocks.8/self_attn/Cast_3"Cast* to (/blocks.8/self_attn/Constant_20_output_0/blocks.8/self_attn/Constant_20"Constant*G value*;B+/blocks.8/self_attn/Constant_20_attr::valueJ (/blocks.8/self_attn/Constant_21_output_0/blocks.8/self_attn/Constant_21"Constant*G value*;B+/blocks.8/self_attn/Constant_21_attr::valueJ (/blocks.8/self_attn/Constant_22_output_0/blocks.8/self_attn/Constant_22"Constant*G value*;B+/blocks.8/self_attn/Constant_22_attr::valueJ  #/blocks.8/self_attn/Cast_3_output_0 (/blocks.8/self_attn/Constant_22_output_0(/blocks.8/self_attn/Unsqueeze_8_output_0/blocks.8/self_attn/Unsqueeze_8" Unsqueeze (/blocks.8/self_attn/Constant_23_output_0/blocks.8/self_attn/Constant_23"Constant*G value*;B+/blocks.8/self_attn/Constant_23_attr::valueJ  */blocks.8/self_attn/k_norm/Cast_2_output_0 (/blocks.8/self_attn/Constant_21_output_0 (/blocks.8/self_attn/Unsqueeze_8_output_0 (/blocks.8/self_attn/Constant_20_output_0 (/blocks.8/self_attn/Constant_23_output_0$/blocks.8/self_attn/Slice_2_output_0/blocks.8/self_attn/Slice_2"Slice (/blocks.8/self_attn/Constant_24_output_0/blocks.8/self_attn/Constant_24"Constant*G value*;B+/blocks.8/self_attn/Constant_24_attr::valueJ (/blocks.8/self_attn/Constant_25_output_0/blocks.8/self_attn/Constant_25"Constant*G value*;B+/blocks.8/self_attn/Constant_25_attr::valueJ  #/blocks.8/self_attn/Cast_3_output_0 (/blocks.8/self_attn/Constant_25_output_0(/blocks.8/self_attn/Unsqueeze_9_output_0/blocks.8/self_attn/Unsqueeze_9" Unsqueeze (/blocks.8/self_attn/Constant_26_output_0/blocks.8/self_attn/Constant_26"Constant*G value*;B+/blocks.8/self_attn/Constant_26_attr::valueJ (/blocks.8/self_attn/Constant_27_output_0/blocks.8/self_attn/Constant_27"Constant*G value*;B+/blocks.8/self_attn/Constant_27_attr::valueJ  */blocks.8/self_attn/k_norm/Cast_2_output_0 (/blocks.8/self_attn/Unsqueeze_9_output_0 (/blocks.8/self_attn/Constant_26_output_0 (/blocks.8/self_attn/Constant_24_output_0 (/blocks.8/self_attn/Constant_27_output_0$/blocks.8/self_attn/Slice_3_output_0/blocks.8/self_attn/Slice_3"Slice j $/blocks.8/self_attn/Slice_3_output_0"/blocks.8/self_attn/Neg_1_output_0/blocks.8/self_attn/Neg_1"Neg  "/blocks.8/self_attn/Neg_1_output_0 $/blocks.8/self_attn/Slice_2_output_0%/blocks.8/self_attn/Concat_4_output_0/blocks.8/self_attn/Concat_4"Concat* axis  %/blocks.8/self_attn/Concat_4_output_0 %/blocks.0/self_attn/Gather_3_output_0"/blocks.8/self_attn/Mul_3_output_0/blocks.8/self_attn/Mul_3"Mul  "/blocks.8/self_attn/Mul_2_output_0 "/blocks.8/self_attn/Mul_3_output_0"/blocks.8/self_attn/Add_1_output_0/blocks.8/self_attn/Add_1"Add  /Gather_8_output_0 /rotary/Constant_3_output_0%/blocks.8/self_attn/Gather_4_output_0/blocks.8/self_attn/Gather_4"Gather* axis  /Gather_8_output_0 /rotary/Constant_8_output_0%/blocks.8/self_attn/Gather_5_output_0/blocks.8/self_attn/Gather_5"Gather* axis  %/blocks.8/self_attn/Gather_4_output_0 "/blocks.8/self_attn/Add_1_output_0%/blocks.8/self_attn/Concat_5_output_0/blocks.8/self_attn/Concat_5"Concat* axis  %/blocks.8/self_attn/Gather_5_output_0 &/blocks.8/self_attn/Reshape_2_output_0%/blocks.8/self_attn/Concat_6_output_0/blocks.8/self_attn/Concat_6"Concat* axis (/blocks.8/self_attn/Constant_28_output_0/blocks.8/self_attn/Constant_28"Constant*G value*;B+/blocks.8/self_attn/Constant_28_attr::valueJ  %/blocks.8/self_attn/Concat_5_output_0 (/blocks.8/self_attn/Constant_28_output_0)/blocks.8/self_attn/Unsqueeze_10_output_0 /blocks.8/self_attn/Unsqueeze_10" Unsqueeze (/blocks.8/self_attn/Constant_29_output_0/blocks.8/self_attn/Constant_29"Constant*G value*;B+/blocks.8/self_attn/Constant_29_attr::valueJ  %/blocks.8/self_attn/Concat_6_output_0 (/blocks.8/self_attn/Constant_29_output_0)/blocks.8/self_attn/Unsqueeze_11_output_0 /blocks.8/self_attn/Unsqueeze_11" Unsqueeze  )/blocks.8/self_attn/Unsqueeze_10_output_0 )/blocks.8/self_attn/Unsqueeze_11_output_0%/blocks.8/self_attn/Concat_7_output_0/blocks.8/self_attn/Concat_7"Concat* axis  /blocks.8/self_attn/Add_output_0&/blocks.8/self_attn/Transpose_output_0/blocks.8/self_attn/Transpose" Transpose* perm@@@@  %/blocks.8/self_attn/Concat_5_output_0(/blocks.8/self_attn/Transpose_1_output_0/blocks.8/self_attn/Transpose_1" Transpose* perm@@@@  %/blocks.8/self_attn/Concat_6_output_0(/blocks.8/self_attn/Transpose_2_output_0/blocks.8/self_attn/Transpose_2" Transpose* perm@@@@ t (/blocks.8/self_attn/Transpose_1_output_0$/blocks.8/self_attn/Shape_4_output_0/blocks.8/self_attn/Shape_4"Shape (/blocks.8/self_attn/Constant_30_output_0/blocks.8/self_attn/Constant_30"Constant*E value*9B+/blocks.8/self_attn/Constant_30_attr::valueJ  $/blocks.8/self_attn/Shape_4_output_0 (/blocks.8/self_attn/Constant_30_output_0%/blocks.8/self_attn/Gather_6_output_0/blocks.8/self_attn/Gather_6"Gather* axis t (/blocks.8/self_attn/Transpose_1_output_0$/blocks.8/self_attn/Shape_5_output_0/blocks.8/self_attn/Shape_5"Shape (/blocks.8/self_attn/Constant_31_output_0/blocks.8/self_attn/Constant_31"Constant*E value*9B+/blocks.8/self_attn/Constant_31_attr::valueJ  $/blocks.8/self_attn/Shape_5_output_0 (/blocks.8/self_attn/Constant_31_output_0%/blocks.8/self_attn/Gather_7_output_0/blocks.8/self_attn/Gather_7"Gather* axis t (/blocks.8/self_attn/Transpose_1_output_0$/blocks.8/self_attn/Shape_6_output_0/blocks.8/self_attn/Shape_6"Shape (/blocks.8/self_attn/Constant_32_output_0/blocks.8/self_attn/Constant_32"Constant*E value*9B+/blocks.8/self_attn/Constant_32_attr::valueJ  $/blocks.8/self_attn/Shape_6_output_0 (/blocks.8/self_attn/Constant_32_output_0%/blocks.8/self_attn/Gather_8_output_0/blocks.8/self_attn/Gather_8"Gather* axis t (/blocks.8/self_attn/Transpose_1_output_0$/blocks.8/self_attn/Shape_7_output_0/blocks.8/self_attn/Shape_7"Shape (/blocks.8/self_attn/Constant_33_output_0/blocks.8/self_attn/Constant_33"Constant*E value*9B+/blocks.8/self_attn/Constant_33_attr::valueJ  $/blocks.8/self_attn/Shape_7_output_0 (/blocks.8/self_attn/Constant_33_output_0%/blocks.8/self_attn/Gather_9_output_0/blocks.8/self_attn/Gather_9"Gather* axis (/blocks.8/self_attn/Constant_34_output_0/blocks.8/self_attn/Constant_34"Constant*G value*;B+/blocks.8/self_attn/Constant_34_attr::valueJ  (/blocks.8/self_attn/Transpose_1_output_0 (/blocks.8/self_attn/Constant_34_output_0)/blocks.8/self_attn/Unsqueeze_12_output_0 /blocks.8/self_attn/Unsqueeze_12" Unsqueeze (/blocks.8/self_attn/Constant_35_output_0/blocks.8/self_attn/Constant_35"Constant*G value*;B+/blocks.8/self_attn/Constant_35_attr::valueJ  %/blocks.8/self_attn/Gather_6_output_0 (/blocks.8/self_attn/Constant_35_output_0)/blocks.8/self_attn/Unsqueeze_13_output_0 /blocks.8/self_attn/Unsqueeze_13" Unsqueeze (/blocks.8/self_attn/Constant_36_output_0/blocks.8/self_attn/Constant_36"Constant*G value*;B+/blocks.8/self_attn/Constant_36_attr::valueJ  %/blocks.8/self_attn/Gather_7_output_0 (/blocks.8/self_attn/Constant_36_output_0)/blocks.8/self_attn/Unsqueeze_14_output_0 /blocks.8/self_attn/Unsqueeze_14" Unsqueeze (/blocks.8/self_attn/Constant_37_output_0/blocks.8/self_attn/Constant_37"Constant*G value*;B+/blocks.8/self_attn/Constant_37_attr::valueJ (/blocks.8/self_attn/Constant_38_output_0/blocks.8/self_attn/Constant_38"Constant*G value*;B+/blocks.8/self_attn/Constant_38_attr::valueJ  %/blocks.8/self_attn/Gather_8_output_0 (/blocks.8/self_attn/Constant_38_output_0)/blocks.8/self_attn/Unsqueeze_15_output_0 /blocks.8/self_attn/Unsqueeze_15" Unsqueeze (/blocks.8/self_attn/Constant_39_output_0/blocks.8/self_attn/Constant_39"Constant*G value*;B+/blocks.8/self_attn/Constant_39_attr::valueJ  %/blocks.8/self_attn/Gather_9_output_0 (/blocks.8/self_attn/Constant_39_output_0)/blocks.8/self_attn/Unsqueeze_16_output_0 /blocks.8/self_attn/Unsqueeze_16" Unsqueeze  )/blocks.8/self_attn/Unsqueeze_13_output_0 )/blocks.8/self_attn/Unsqueeze_14_output_0 (/blocks.8/self_attn/Constant_37_output_0 )/blocks.8/self_attn/Unsqueeze_15_output_0 )/blocks.8/self_attn/Unsqueeze_16_output_0%/blocks.8/self_attn/Concat_8_output_0/blocks.8/self_attn/Concat_8"Concat* axis (/blocks.8/self_attn/Constant_40_output_0/blocks.8/self_attn/Constant_40"Constant*G value*;B+/blocks.8/self_attn/Constant_40_attr::valueJ  %/blocks.8/self_attn/Concat_8_output_0 (/blocks.8/self_attn/Constant_40_output_0&/blocks.8/self_attn/Reshape_3_output_0/blocks.8/self_attn/Reshape_3"Reshape* allowzero r &/blocks.8/self_attn/Reshape_3_output_0$/blocks.8/self_attn/Shape_8_output_0/blocks.8/self_attn/Shape_8"Shape  $/blocks.8/self_attn/Shape_8_output_0,/blocks.8/self_attn/ConstantOfShape_output_0#/blocks.8/self_attn/ConstantOfShape"ConstantOfShape*K value*?B//blocks.8/self_attn/ConstantOfShape_attr::valueJ (/blocks.8/self_attn/Constant_41_output_0/blocks.8/self_attn/Constant_41"Constant*E value*9B+/blocks.8/self_attn/Constant_41_attr::valueJ  ,/blocks.8/self_attn/ConstantOfShape_output_0 (/blocks.8/self_attn/Constant_41_output_0"/blocks.8/self_attn/Mul_4_output_0/blocks.8/self_attn/Mul_4"Mul  &/blocks.8/self_attn/Reshape_3_output_0 "/blocks.8/self_attn/Mul_4_output_0"/blocks.8/self_attn/Equal_output_0/blocks.8/self_attn/Equal"Equal  "/blocks.8/self_attn/Equal_output_0 ,/blocks.8/self_attn/ConstantOfShape_output_0 &/blocks.8/self_attn/Reshape_3_output_0"/blocks.8/self_attn/Where_output_0/blocks.8/self_attn/Where"Where  )/blocks.8/self_attn/Unsqueeze_12_output_0 "/blocks.8/self_attn/Where_output_0#/blocks.8/self_attn/Expand_output_0/blocks.8/self_attn/Expand"Expand (/blocks.8/self_attn/Constant_42_output_0/blocks.8/self_attn/Constant_42"Constant*E value*9B+/blocks.8/self_attn/Constant_42_attr::valueJ  %/blocks.8/self_attn/Gather_7_output_0 (/blocks.8/self_attn/Constant_42_output_0"/blocks.8/self_attn/Mul_5_output_0/blocks.8/self_attn/Mul_5"Mul fonnx::Unsqueeze_2860 Constant_4799"Constant*5 value*)BConstant_4799_attr::valueJ  %/blocks.8/self_attn/Gather_6_output_0 onnx::Unsqueeze_2860)/blocks.8/self_attn/Unsqueeze_17_output_0 /blocks.8/self_attn/Unsqueeze_17" Unsqueeze fonnx::Unsqueeze_2862 Constant_4801"Constant*5 value*)BConstant_4801_attr::valueJ  "/blocks.8/self_attn/Mul_5_output_0 onnx::Unsqueeze_2862)/blocks.8/self_attn/Unsqueeze_18_output_0 /blocks.8/self_attn/Unsqueeze_18" Unsqueeze fonnx::Unsqueeze_2864 Constant_4803"Constant*5 value*)BConstant_4803_attr::valueJ  %/blocks.8/self_attn/Gather_8_output_0 onnx::Unsqueeze_2864)/blocks.8/self_attn/Unsqueeze_19_output_0 /blocks.8/self_attn/Unsqueeze_19" Unsqueeze fonnx::Unsqueeze_2866 Constant_4805"Constant*5 value*)BConstant_4805_attr::valueJ  %/blocks.8/self_attn/Gather_9_output_0 onnx::Unsqueeze_2866)/blocks.8/self_attn/Unsqueeze_20_output_0 /blocks.8/self_attn/Unsqueeze_20" Unsqueeze  )/blocks.8/self_attn/Unsqueeze_17_output_0 )/blocks.8/self_attn/Unsqueeze_18_output_0 )/blocks.8/self_attn/Unsqueeze_19_output_0 )/blocks.8/self_attn/Unsqueeze_20_output_0%/blocks.8/self_attn/Concat_9_output_0/blocks.8/self_attn/Concat_9"Concat* axis  #/blocks.8/self_attn/Expand_output_0 %/blocks.8/self_attn/Concat_9_output_0&/blocks.8/self_attn/Reshape_4_output_0/blocks.8/self_attn/Reshape_4"Reshape* allowzero t (/blocks.8/self_attn/Transpose_2_output_0$/blocks.8/self_attn/Shape_9_output_0/blocks.8/self_attn/Shape_9"Shape (/blocks.8/self_attn/Constant_43_output_0/blocks.8/self_attn/Constant_43"Constant*E value*9B+/blocks.8/self_attn/Constant_43_attr::valueJ  $/blocks.8/self_attn/Shape_9_output_0 (/blocks.8/self_attn/Constant_43_output_0&/blocks.8/self_attn/Gather_10_output_0/blocks.8/self_attn/Gather_10"Gather* axis v (/blocks.8/self_attn/Transpose_2_output_0%/blocks.8/self_attn/Shape_10_output_0/blocks.8/self_attn/Shape_10"Shape (/blocks.8/self_attn/Constant_44_output_0/blocks.8/self_attn/Constant_44"Constant*E value*9B+/blocks.8/self_attn/Constant_44_attr::valueJ  %/blocks.8/self_attn/Shape_10_output_0 (/blocks.8/self_attn/Constant_44_output_0&/blocks.8/self_attn/Gather_11_output_0/blocks.8/self_attn/Gather_11"Gather* axis v (/blocks.8/self_attn/Transpose_2_output_0%/blocks.8/self_attn/Shape_11_output_0/blocks.8/self_attn/Shape_11"Shape (/blocks.8/self_attn/Constant_45_output_0/blocks.8/self_attn/Constant_45"Constant*E value*9B+/blocks.8/self_attn/Constant_45_attr::valueJ  %/blocks.8/self_attn/Shape_11_output_0 (/blocks.8/self_attn/Constant_45_output_0&/blocks.8/self_attn/Gather_12_output_0/blocks.8/self_attn/Gather_12"Gather* axis v (/blocks.8/self_attn/Transpose_2_output_0%/blocks.8/self_attn/Shape_12_output_0/blocks.8/self_attn/Shape_12"Shape (/blocks.8/self_attn/Constant_46_output_0/blocks.8/self_attn/Constant_46"Constant*E value*9B+/blocks.8/self_attn/Constant_46_attr::valueJ  %/blocks.8/self_attn/Shape_12_output_0 (/blocks.8/self_attn/Constant_46_output_0&/blocks.8/self_attn/Gather_13_output_0/blocks.8/self_attn/Gather_13"Gather* axis (/blocks.8/self_attn/Constant_47_output_0/blocks.8/self_attn/Constant_47"Constant*G value*;B+/blocks.8/self_attn/Constant_47_attr::valueJ  (/blocks.8/self_attn/Transpose_2_output_0 (/blocks.8/self_attn/Constant_47_output_0)/blocks.8/self_attn/Unsqueeze_21_output_0 /blocks.8/self_attn/Unsqueeze_21" Unsqueeze (/blocks.8/self_attn/Constant_48_output_0/blocks.8/self_attn/Constant_48"Constant*G value*;B+/blocks.8/self_attn/Constant_48_attr::valueJ  &/blocks.8/self_attn/Gather_10_output_0 (/blocks.8/self_attn/Constant_48_output_0)/blocks.8/self_attn/Unsqueeze_22_output_0 /blocks.8/self_attn/Unsqueeze_22" Unsqueeze (/blocks.8/self_attn/Constant_49_output_0/blocks.8/self_attn/Constant_49"Constant*G value*;B+/blocks.8/self_attn/Constant_49_attr::valueJ  &/blocks.8/self_attn/Gather_11_output_0 (/blocks.8/self_attn/Constant_49_output_0)/blocks.8/self_attn/Unsqueeze_23_output_0 /blocks.8/self_attn/Unsqueeze_23" Unsqueeze (/blocks.8/self_attn/Constant_50_output_0/blocks.8/self_attn/Constant_50"Constant*G value*;B+/blocks.8/self_attn/Constant_50_attr::valueJ (/blocks.8/self_attn/Constant_51_output_0/blocks.8/self_attn/Constant_51"Constant*G value*;B+/blocks.8/self_attn/Constant_51_attr::valueJ  &/blocks.8/self_attn/Gather_12_output_0 (/blocks.8/self_attn/Constant_51_output_0)/blocks.8/self_attn/Unsqueeze_24_output_0 /blocks.8/self_attn/Unsqueeze_24" Unsqueeze (/blocks.8/self_attn/Constant_52_output_0/blocks.8/self_attn/Constant_52"Constant*G value*;B+/blocks.8/self_attn/Constant_52_attr::valueJ  &/blocks.8/self_attn/Gather_13_output_0 (/blocks.8/self_attn/Constant_52_output_0)/blocks.8/self_attn/Unsqueeze_25_output_0 /blocks.8/self_attn/Unsqueeze_25" Unsqueeze  )/blocks.8/self_attn/Unsqueeze_22_output_0 )/blocks.8/self_attn/Unsqueeze_23_output_0 (/blocks.8/self_attn/Constant_50_output_0 )/blocks.8/self_attn/Unsqueeze_24_output_0 )/blocks.8/self_attn/Unsqueeze_25_output_0&/blocks.8/self_attn/Concat_10_output_0/blocks.8/self_attn/Concat_10"Concat* axis (/blocks.8/self_attn/Constant_53_output_0/blocks.8/self_attn/Constant_53"Constant*G value*;B+/blocks.8/self_attn/Constant_53_attr::valueJ  &/blocks.8/self_attn/Concat_10_output_0 (/blocks.8/self_attn/Constant_53_output_0&/blocks.8/self_attn/Reshape_5_output_0/blocks.8/self_attn/Reshape_5"Reshape* allowzero t &/blocks.8/self_attn/Reshape_5_output_0%/blocks.8/self_attn/Shape_13_output_0/blocks.8/self_attn/Shape_13"Shape  %/blocks.8/self_attn/Shape_13_output_0./blocks.8/self_attn/ConstantOfShape_1_output_0%/blocks.8/self_attn/ConstantOfShape_1"ConstantOfShape*M value*AB1/blocks.8/self_attn/ConstantOfShape_1_attr::valueJ (/blocks.8/self_attn/Constant_54_output_0/blocks.8/self_attn/Constant_54"Constant*E value*9B+/blocks.8/self_attn/Constant_54_attr::valueJ  ./blocks.8/self_attn/ConstantOfShape_1_output_0 (/blocks.8/self_attn/Constant_54_output_0"/blocks.8/self_attn/Mul_6_output_0/blocks.8/self_attn/Mul_6"Mul  &/blocks.8/self_attn/Reshape_5_output_0 "/blocks.8/self_attn/Mul_6_output_0$/blocks.8/self_attn/Equal_1_output_0/blocks.8/self_attn/Equal_1"Equal  $/blocks.8/self_attn/Equal_1_output_0 ./blocks.8/self_attn/ConstantOfShape_1_output_0 &/blocks.8/self_attn/Reshape_5_output_0$/blocks.8/self_attn/Where_1_output_0/blocks.8/self_attn/Where_1"Where  )/blocks.8/self_attn/Unsqueeze_21_output_0 $/blocks.8/self_attn/Where_1_output_0%/blocks.8/self_attn/Expand_1_output_0/blocks.8/self_attn/Expand_1"Expand (/blocks.8/self_attn/Constant_55_output_0/blocks.8/self_attn/Constant_55"Constant*E value*9B+/blocks.8/self_attn/Constant_55_attr::valueJ  &/blocks.8/self_attn/Gather_11_output_0 (/blocks.8/self_attn/Constant_55_output_0"/blocks.8/self_attn/Mul_7_output_0/blocks.8/self_attn/Mul_7"Mul fonnx::Unsqueeze_2906 Constant_4844"Constant*5 value*)BConstant_4844_attr::valueJ  &/blocks.8/self_attn/Gather_10_output_0 onnx::Unsqueeze_2906)/blocks.8/self_attn/Unsqueeze_26_output_0 /blocks.8/self_attn/Unsqueeze_26" Unsqueeze fonnx::Unsqueeze_2908 Constant_4846"Constant*5 value*)BConstant_4846_attr::valueJ  "/blocks.8/self_attn/Mul_7_output_0 onnx::Unsqueeze_2908)/blocks.8/self_attn/Unsqueeze_27_output_0 /blocks.8/self_attn/Unsqueeze_27" Unsqueeze fonnx::Unsqueeze_2910 Constant_4848"Constant*5 value*)BConstant_4848_attr::valueJ  &/blocks.8/self_attn/Gather_12_output_0 onnx::Unsqueeze_2910)/blocks.8/self_attn/Unsqueeze_28_output_0 /blocks.8/self_attn/Unsqueeze_28" Unsqueeze fonnx::Unsqueeze_2912 Constant_4850"Constant*5 value*)BConstant_4850_attr::valueJ  &/blocks.8/self_attn/Gather_13_output_0 onnx::Unsqueeze_2912)/blocks.8/self_attn/Unsqueeze_29_output_0 /blocks.8/self_attn/Unsqueeze_29" Unsqueeze  )/blocks.8/self_attn/Unsqueeze_26_output_0 )/blocks.8/self_attn/Unsqueeze_27_output_0 )/blocks.8/self_attn/Unsqueeze_28_output_0 )/blocks.8/self_attn/Unsqueeze_29_output_0&/blocks.8/self_attn/Concat_11_output_0/blocks.8/self_attn/Concat_11"Concat* axis  %/blocks.8/self_attn/Expand_1_output_0 &/blocks.8/self_attn/Concat_11_output_0&/blocks.8/self_attn/Reshape_6_output_0/blocks.8/self_attn/Reshape_6"Reshape* allowzero  &/blocks.8/self_attn/Transpose_output_0 &/blocks.8/self_attn/Reshape_4_output_0#/blocks.8/self_attn/MatMul_output_0/blocks.8/self_attn/MatMul"MatMul (/blocks.8/self_attn/Constant_56_output_0/blocks.8/self_attn/Constant_56"Constant*A value*5B+/blocks.8/self_attn/Constant_56_attr::valueJ5A  #/blocks.8/self_attn/MatMul_output_0 (/blocks.8/self_attn/Constant_56_output_0"/blocks.8/self_attn/Div_2_output_0/blocks.8/self_attn/Div_2"Div x "/blocks.8/self_attn/Div_2_output_0 attention_mask"/blocks.8/self_attn/Add_2_output_0/blocks.8/self_attn/Add_2"Add  "/blocks.8/self_attn/Add_2_output_0$/blocks.8/self_attn/Softmax_output_0/blocks.8/self_attn/Softmax"Softmax* axis x $/blocks.8/self_attn/Softmax_output_0#/blocks.8/self_attn/Cast_4_output_0/blocks.8/self_attn/Cast_4"Cast* to  #/blocks.8/self_attn/Cast_4_output_0 &/blocks.8/self_attn/Reshape_6_output_0%/blocks.8/self_attn/MatMul_1_output_0/blocks.8/self_attn/MatMul_1"MatMul  %/blocks.8/self_attn/MatMul_1_output_0(/blocks.8/self_attn/Transpose_3_output_0/blocks.8/self_attn/Transpose_3" Transpose* perm@@@@ fonnx::Unsqueeze_2924 Constant_4862"Constant*5 value*)BConstant_4862_attr::valueJ  #/blocks.8/self_attn/Gather_output_0 onnx::Unsqueeze_2924)/blocks.8/self_attn/Unsqueeze_30_output_0 /blocks.8/self_attn/Unsqueeze_30" Unsqueeze fonnx::Unsqueeze_2926 Constant_4864"Constant*5 value*)BConstant_4864_attr::valueJ  %/blocks.8/self_attn/Gather_1_output_0 onnx::Unsqueeze_2926)/blocks.8/self_attn/Unsqueeze_31_output_0 /blocks.8/self_attn/Unsqueeze_31" Unsqueeze (/blocks.8/self_attn/Constant_57_output_0/blocks.8/self_attn/Constant_57"Constant*G value*;B+/blocks.8/self_attn/Constant_57_attr::valueJ  )/blocks.8/self_attn/Unsqueeze_30_output_0 )/blocks.8/self_attn/Unsqueeze_31_output_0 (/blocks.8/self_attn/Constant_57_output_0&/blocks.8/self_attn/Concat_12_output_0/blocks.8/self_attn/Concat_12"Concat* axis  (/blocks.8/self_attn/Transpose_3_output_0 &/blocks.8/self_attn/Concat_12_output_0&/blocks.8/self_attn/Reshape_7_output_0/blocks.8/self_attn/Reshape_7"Reshape* allowzero  &/blocks.8/self_attn/Reshape_7_output_0 onnx::MatMul_8813*/blocks.8/self_attn/o_proj/MatMul_output_0!/blocks.8/self_attn/o_proj/MatMul"MatMul  )/blocks.8/input_layernorm/Cast_1_output_0 */blocks.8/self_attn/o_proj/MatMul_output_0/blocks.8/Add_output_0 /blocks.8/Add"Add  /blocks.8/Add_output_00/blocks.8/post_attention_layernorm/Cast_output_0'/blocks.8/post_attention_layernorm/Cast"Cast* to 4/blocks.8/post_attention_layernorm/Constant_output_0+/blocks.8/post_attention_layernorm/Constant"Constant*M value*AB7/blocks.8/post_attention_layernorm/Constant_attr::valueJ@  0/blocks.8/post_attention_layernorm/Cast_output_0 4/blocks.8/post_attention_layernorm/Constant_output_0//blocks.8/post_attention_layernorm/Pow_output_0&/blocks.8/post_attention_layernorm/Pow"Pow  //blocks.8/post_attention_layernorm/Pow_output_06/blocks.8/post_attention_layernorm/ReduceMean_output_0-/blocks.8/post_attention_layernorm/ReduceMean" ReduceMean* axes@* keepdims 6/blocks.8/post_attention_layernorm/Constant_1_output_0-/blocks.8/post_attention_layernorm/Constant_1"Constant*O value*CB9/blocks.8/post_attention_layernorm/Constant_1_attr::valueJ75  6/blocks.8/post_attention_layernorm/ReduceMean_output_0 6/blocks.8/post_attention_layernorm/Constant_1_output_0//blocks.8/post_attention_layernorm/Add_output_0&/blocks.8/post_attention_layernorm/Add"Add  //blocks.8/post_attention_layernorm/Add_output_00/blocks.8/post_attention_layernorm/Sqrt_output_0'/blocks.8/post_attention_layernorm/Sqrt"Sqrt 6/blocks.8/post_attention_layernorm/Constant_2_output_0-/blocks.8/post_attention_layernorm/Constant_2"Constant*O value*CB9/blocks.8/post_attention_layernorm/Constant_2_attr::valueJ?  6/blocks.8/post_attention_layernorm/Constant_2_output_0 0/blocks.8/post_attention_layernorm/Sqrt_output_0//blocks.8/post_attention_layernorm/Div_output_0&/blocks.8/post_attention_layernorm/Div"Div  0/blocks.8/post_attention_layernorm/Cast_output_02/blocks.8/post_attention_layernorm/Cast_1_output_0)/blocks.8/post_attention_layernorm/Cast_1"Cast* to  2/blocks.8/post_attention_layernorm/Cast_1_output_0 //blocks.8/post_attention_layernorm/Div_output_0//blocks.8/post_attention_layernorm/Mul_output_0&/blocks.8/post_attention_layernorm/Mul"Mul  //blocks.8/post_attention_layernorm/Mul_output_0 (blocks.8.post_attention_layernorm.weight1/blocks.8/post_attention_layernorm/Mul_1_output_0(/blocks.8/post_attention_layernorm/Mul_1"Mul  1/blocks.8/post_attention_layernorm/Mul_1_output_02/blocks.8/post_attention_layernorm/Cast_2_output_0)/blocks.8/post_attention_layernorm/Cast_2"Cast* to  2/blocks.8/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_8814'/blocks.8/mlp/gate_proj/MatMul_output_0/blocks.8/mlp/gate_proj/MatMul"MatMul w '/blocks.8/mlp/gate_proj/MatMul_output_0%/blocks.8/mlp/act_fn/Sigmoid_output_0/blocks.8/mlp/act_fn/Sigmoid"Sigmoid  '/blocks.8/mlp/gate_proj/MatMul_output_0 %/blocks.8/mlp/act_fn/Sigmoid_output_0!/blocks.8/mlp/act_fn/Mul_output_0/blocks.8/mlp/act_fn/Mul"Mul  2/blocks.8/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_8815%/blocks.8/mlp/up_proj/MatMul_output_0/blocks.8/mlp/up_proj/MatMul"MatMul ~ !/blocks.8/mlp/act_fn/Mul_output_0 %/blocks.8/mlp/up_proj/MatMul_output_0/blocks.8/mlp/Mul_output_0/blocks.8/mlp/Mul"Mul  /blocks.8/mlp/Mul_output_0 onnx::MatMul_8816'/blocks.8/mlp/down_proj/MatMul_output_0/blocks.8/mlp/down_proj/MatMul"MatMul  2/blocks.8/post_attention_layernorm/Cast_1_output_0 '/blocks.8/mlp/down_proj/MatMul_output_0/blocks.8/Add_1_output_0/blocks.8/Add_1"Add `/Constant_2_output_0 /Constant_2"Constant*1 value*%B/Constant_2_attr::valueJ  [ past_key_values /Constant_2_output_0/Gather_9_output_0 /Gather_9"Gather* axis /blocks.9/Constant_output_0/blocks.9/Constant"Constant*J value*>B/blocks.9/Constant_attr::valueJ  /blocks.8/Add_1_output_0 /blocks.9/Constant_output_0/blocks.9/Reshape_output_0/blocks.9/Reshape"Reshape* allowzero v /blocks.9/Reshape_output_0'/blocks.9/input_layernorm/Cast_output_0/blocks.9/input_layernorm/Cast"Cast* to +/blocks.9/input_layernorm/Constant_output_0"/blocks.9/input_layernorm/Constant"Constant*D value*8B./blocks.9/input_layernorm/Constant_attr::valueJ@  '/blocks.9/input_layernorm/Cast_output_0 +/blocks.9/input_layernorm/Constant_output_0&/blocks.9/input_layernorm/Pow_output_0/blocks.9/input_layernorm/Pow"Pow  &/blocks.9/input_layernorm/Pow_output_0-/blocks.9/input_layernorm/ReduceMean_output_0$/blocks.9/input_layernorm/ReduceMean" ReduceMean* axes@* keepdims -/blocks.9/input_layernorm/Constant_1_output_0$/blocks.9/input_layernorm/Constant_1"Constant*F value*:B0/blocks.9/input_layernorm/Constant_1_attr::valueJ75  -/blocks.9/input_layernorm/ReduceMean_output_0 -/blocks.9/input_layernorm/Constant_1_output_0&/blocks.9/input_layernorm/Add_output_0/blocks.9/input_layernorm/Add"Add w &/blocks.9/input_layernorm/Add_output_0'/blocks.9/input_layernorm/Sqrt_output_0/blocks.9/input_layernorm/Sqrt"Sqrt -/blocks.9/input_layernorm/Constant_2_output_0$/blocks.9/input_layernorm/Constant_2"Constant*F value*:B0/blocks.9/input_layernorm/Constant_2_attr::valueJ?  -/blocks.9/input_layernorm/Constant_2_output_0 '/blocks.9/input_layernorm/Sqrt_output_0&/blocks.9/input_layernorm/Div_output_0/blocks.9/input_layernorm/Div"Div  '/blocks.9/input_layernorm/Cast_output_0)/blocks.9/input_layernorm/Cast_1_output_0 /blocks.9/input_layernorm/Cast_1"Cast* to  )/blocks.9/input_layernorm/Cast_1_output_0 &/blocks.9/input_layernorm/Div_output_0&/blocks.9/input_layernorm/Mul_output_0/blocks.9/input_layernorm/Mul"Mul  &/blocks.9/input_layernorm/Mul_output_0 blocks.9.input_layernorm.weight(/blocks.9/input_layernorm/Mul_1_output_0/blocks.9/input_layernorm/Mul_1"Mul  (/blocks.9/input_layernorm/Mul_1_output_0)/blocks.9/input_layernorm/Cast_2_output_0 /blocks.9/input_layernorm/Cast_2"Cast* to q )/blocks.9/input_layernorm/Cast_2_output_0"/blocks.9/self_attn/Shape_output_0/blocks.9/self_attn/Shape"Shape %/blocks.9/self_attn/Constant_output_0/blocks.9/self_attn/Constant"Constant*B value*6B(/blocks.9/self_attn/Constant_attr::valueJ  "/blocks.9/self_attn/Shape_output_0 %/blocks.9/self_attn/Constant_output_0#/blocks.9/self_attn/Gather_output_0/blocks.9/self_attn/Gather"Gather* axis u )/blocks.9/input_layernorm/Cast_2_output_0$/blocks.9/self_attn/Shape_1_output_0/blocks.9/self_attn/Shape_1"Shape '/blocks.9/self_attn/Constant_1_output_0/blocks.9/self_attn/Constant_1"Constant*D value*8B*/blocks.9/self_attn/Constant_1_attr::valueJ  $/blocks.9/self_attn/Shape_1_output_0 '/blocks.9/self_attn/Constant_1_output_0%/blocks.9/self_attn/Gather_1_output_0/blocks.9/self_attn/Gather_1"Gather* axis  )/blocks.9/input_layernorm/Cast_2_output_0 onnx::MatMul_8817*/blocks.9/self_attn/q_proj/MatMul_output_0!/blocks.9/self_attn/q_proj/MatMul"MatMul  )/blocks.9/input_layernorm/Cast_2_output_0 onnx::MatMul_8818*/blocks.9/self_attn/k_proj/MatMul_output_0!/blocks.9/self_attn/k_proj/MatMul"MatMul  )/blocks.9/input_layernorm/Cast_2_output_0 onnx::MatMul_8819*/blocks.9/self_attn/v_proj/MatMul_output_0!/blocks.9/self_attn/v_proj/MatMul"MatMul fonnx::Unsqueeze_2987 Constant_4917"Constant*5 value*)BConstant_4917_attr::valueJ  #/blocks.9/self_attn/Gather_output_0 onnx::Unsqueeze_2987&/blocks.9/self_attn/Unsqueeze_output_0/blocks.9/self_attn/Unsqueeze" Unsqueeze fonnx::Unsqueeze_2989 Constant_4919"Constant*5 value*)BConstant_4919_attr::valueJ  %/blocks.9/self_attn/Gather_1_output_0 onnx::Unsqueeze_2989(/blocks.9/self_attn/Unsqueeze_1_output_0/blocks.9/self_attn/Unsqueeze_1" Unsqueeze '/blocks.9/self_attn/Constant_2_output_0/blocks.9/self_attn/Constant_2"Constant*F value*:B*/blocks.9/self_attn/Constant_2_attr::valueJ '/blocks.9/self_attn/Constant_3_output_0/blocks.9/self_attn/Constant_3"Constant*F value*:B*/blocks.9/self_attn/Constant_3_attr::valueJ  &/blocks.9/self_attn/Unsqueeze_output_0 (/blocks.9/self_attn/Unsqueeze_1_output_0 '/blocks.9/self_attn/Constant_2_output_0 '/blocks.9/self_attn/Constant_3_output_0#/blocks.9/self_attn/Concat_output_0/blocks.9/self_attn/Concat"Concat* axis  */blocks.9/self_attn/q_proj/MatMul_output_0 #/blocks.9/self_attn/Concat_output_0$/blocks.9/self_attn/Reshape_output_0/blocks.9/self_attn/Reshape"Reshape* allowzero fonnx::Unsqueeze_2997 Constant_4925"Constant*5 value*)BConstant_4925_attr::valueJ  #/blocks.9/self_attn/Gather_output_0 onnx::Unsqueeze_2997(/blocks.9/self_attn/Unsqueeze_2_output_0/blocks.9/self_attn/Unsqueeze_2" Unsqueeze fonnx::Unsqueeze_2999 Constant_4927"Constant*5 value*)BConstant_4927_attr::valueJ  %/blocks.9/self_attn/Gather_1_output_0 onnx::Unsqueeze_2999(/blocks.9/self_attn/Unsqueeze_3_output_0/blocks.9/self_attn/Unsqueeze_3" Unsqueeze '/blocks.9/self_attn/Constant_4_output_0/blocks.9/self_attn/Constant_4"Constant*F value*:B*/blocks.9/self_attn/Constant_4_attr::valueJ '/blocks.9/self_attn/Constant_5_output_0/blocks.9/self_attn/Constant_5"Constant*F value*:B*/blocks.9/self_attn/Constant_5_attr::valueJ  (/blocks.9/self_attn/Unsqueeze_2_output_0 (/blocks.9/self_attn/Unsqueeze_3_output_0 '/blocks.9/self_attn/Constant_4_output_0 '/blocks.9/self_attn/Constant_5_output_0%/blocks.9/self_attn/Concat_1_output_0/blocks.9/self_attn/Concat_1"Concat* axis fonnx::Unsqueeze_3006 Constant_4932"Constant*5 value*)BConstant_4932_attr::valueJ  #/blocks.9/self_attn/Gather_output_0 onnx::Unsqueeze_3006(/blocks.9/self_attn/Unsqueeze_4_output_0/blocks.9/self_attn/Unsqueeze_4" Unsqueeze fonnx::Unsqueeze_3008 Constant_4934"Constant*5 value*)BConstant_4934_attr::valueJ  %/blocks.9/self_attn/Gather_1_output_0 onnx::Unsqueeze_3008(/blocks.9/self_attn/Unsqueeze_5_output_0/blocks.9/self_attn/Unsqueeze_5" Unsqueeze '/blocks.9/self_attn/Constant_6_output_0/blocks.9/self_attn/Constant_6"Constant*F value*:B*/blocks.9/self_attn/Constant_6_attr::valueJ '/blocks.9/self_attn/Constant_7_output_0/blocks.9/self_attn/Constant_7"Constant*F value*:B*/blocks.9/self_attn/Constant_7_attr::valueJ  (/blocks.9/self_attn/Unsqueeze_4_output_0 (/blocks.9/self_attn/Unsqueeze_5_output_0 '/blocks.9/self_attn/Constant_6_output_0 '/blocks.9/self_attn/Constant_7_output_0%/blocks.9/self_attn/Concat_2_output_0/blocks.9/self_attn/Concat_2"Concat* axis  */blocks.9/self_attn/k_proj/MatMul_output_0 %/blocks.9/self_attn/Concat_1_output_0&/blocks.9/self_attn/Reshape_1_output_0/blocks.9/self_attn/Reshape_1"Reshape* allowzero  */blocks.9/self_attn/v_proj/MatMul_output_0 %/blocks.9/self_attn/Concat_2_output_0&/blocks.9/self_attn/Reshape_2_output_0/blocks.9/self_attn/Reshape_2"Reshape* allowzero  $/blocks.9/self_attn/Reshape_output_0(/blocks.9/self_attn/q_norm/Cast_output_0/blocks.9/self_attn/q_norm/Cast"Cast* to ,/blocks.9/self_attn/q_norm/Constant_output_0#/blocks.9/self_attn/q_norm/Constant"Constant*E value*9B//blocks.9/self_attn/q_norm/Constant_attr::valueJ@  (/blocks.9/self_attn/q_norm/Cast_output_0 ,/blocks.9/self_attn/q_norm/Constant_output_0'/blocks.9/self_attn/q_norm/Pow_output_0/blocks.9/self_attn/q_norm/Pow"Pow  '/blocks.9/self_attn/q_norm/Pow_output_0./blocks.9/self_attn/q_norm/ReduceMean_output_0%/blocks.9/self_attn/q_norm/ReduceMean" ReduceMean* axes@* keepdims ./blocks.9/self_attn/q_norm/Constant_1_output_0%/blocks.9/self_attn/q_norm/Constant_1"Constant*G value*;B1/blocks.9/self_attn/q_norm/Constant_1_attr::valueJ75  ./blocks.9/self_attn/q_norm/ReduceMean_output_0 ./blocks.9/self_attn/q_norm/Constant_1_output_0'/blocks.9/self_attn/q_norm/Add_output_0/blocks.9/self_attn/q_norm/Add"Add z '/blocks.9/self_attn/q_norm/Add_output_0(/blocks.9/self_attn/q_norm/Sqrt_output_0/blocks.9/self_attn/q_norm/Sqrt"Sqrt ./blocks.9/self_attn/q_norm/Constant_2_output_0%/blocks.9/self_attn/q_norm/Constant_2"Constant*G value*;B1/blocks.9/self_attn/q_norm/Constant_2_attr::valueJ?  ./blocks.9/self_attn/q_norm/Constant_2_output_0 (/blocks.9/self_attn/q_norm/Sqrt_output_0'/blocks.9/self_attn/q_norm/Div_output_0/blocks.9/self_attn/q_norm/Div"Div  (/blocks.9/self_attn/q_norm/Cast_output_0*/blocks.9/self_attn/q_norm/Cast_1_output_0!/blocks.9/self_attn/q_norm/Cast_1"Cast* to  */blocks.9/self_attn/q_norm/Cast_1_output_0 '/blocks.9/self_attn/q_norm/Div_output_0'/blocks.9/self_attn/q_norm/Mul_output_0/blocks.9/self_attn/q_norm/Mul"Mul  '/blocks.9/self_attn/q_norm/Mul_output_0 blocks.9.self_attn.q_norm.weight)/blocks.9/self_attn/q_norm/Mul_1_output_0 /blocks.9/self_attn/q_norm/Mul_1"Mul  )/blocks.9/self_attn/q_norm/Mul_1_output_0*/blocks.9/self_attn/q_norm/Cast_2_output_0!/blocks.9/self_attn/q_norm/Cast_2"Cast* to  &/blocks.9/self_attn/Reshape_1_output_0(/blocks.9/self_attn/k_norm/Cast_output_0/blocks.9/self_attn/k_norm/Cast"Cast* to ,/blocks.9/self_attn/k_norm/Constant_output_0#/blocks.9/self_attn/k_norm/Constant"Constant*E value*9B//blocks.9/self_attn/k_norm/Constant_attr::valueJ@  (/blocks.9/self_attn/k_norm/Cast_output_0 ,/blocks.9/self_attn/k_norm/Constant_output_0'/blocks.9/self_attn/k_norm/Pow_output_0/blocks.9/self_attn/k_norm/Pow"Pow  '/blocks.9/self_attn/k_norm/Pow_output_0./blocks.9/self_attn/k_norm/ReduceMean_output_0%/blocks.9/self_attn/k_norm/ReduceMean" ReduceMean* axes@* keepdims ./blocks.9/self_attn/k_norm/Constant_1_output_0%/blocks.9/self_attn/k_norm/Constant_1"Constant*G value*;B1/blocks.9/self_attn/k_norm/Constant_1_attr::valueJ75  ./blocks.9/self_attn/k_norm/ReduceMean_output_0 ./blocks.9/self_attn/k_norm/Constant_1_output_0'/blocks.9/self_attn/k_norm/Add_output_0/blocks.9/self_attn/k_norm/Add"Add z '/blocks.9/self_attn/k_norm/Add_output_0(/blocks.9/self_attn/k_norm/Sqrt_output_0/blocks.9/self_attn/k_norm/Sqrt"Sqrt ./blocks.9/self_attn/k_norm/Constant_2_output_0%/blocks.9/self_attn/k_norm/Constant_2"Constant*G value*;B1/blocks.9/self_attn/k_norm/Constant_2_attr::valueJ?  ./blocks.9/self_attn/k_norm/Constant_2_output_0 (/blocks.9/self_attn/k_norm/Sqrt_output_0'/blocks.9/self_attn/k_norm/Div_output_0/blocks.9/self_attn/k_norm/Div"Div  (/blocks.9/self_attn/k_norm/Cast_output_0*/blocks.9/self_attn/k_norm/Cast_1_output_0!/blocks.9/self_attn/k_norm/Cast_1"Cast* to  */blocks.9/self_attn/k_norm/Cast_1_output_0 '/blocks.9/self_attn/k_norm/Div_output_0'/blocks.9/self_attn/k_norm/Mul_output_0/blocks.9/self_attn/k_norm/Mul"Mul  '/blocks.9/self_attn/k_norm/Mul_output_0 blocks.9.self_attn.k_norm.weight)/blocks.9/self_attn/k_norm/Mul_1_output_0 /blocks.9/self_attn/k_norm/Mul_1"Mul  )/blocks.9/self_attn/k_norm/Mul_1_output_0*/blocks.9/self_attn/k_norm/Cast_2_output_0!/blocks.9/self_attn/k_norm/Cast_2"Cast* to  */blocks.9/self_attn/q_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0 /blocks.9/self_attn/Mul_output_0/blocks.9/self_attn/Mul"Mul v */blocks.9/self_attn/q_norm/Cast_2_output_0$/blocks.9/self_attn/Shape_2_output_0/blocks.9/self_attn/Shape_2"Shape '/blocks.9/self_attn/Constant_8_output_0/blocks.9/self_attn/Constant_8"Constant*D value*8B*/blocks.9/self_attn/Constant_8_attr::valueJ  $/blocks.9/self_attn/Shape_2_output_0 '/blocks.9/self_attn/Constant_8_output_0%/blocks.9/self_attn/Gather_2_output_0/blocks.9/self_attn/Gather_2"Gather* axis '/blocks.9/self_attn/Constant_9_output_0/blocks.9/self_attn/Constant_9"Constant*D value*8B*/blocks.9/self_attn/Constant_9_attr::valueJ  %/blocks.9/self_attn/Gather_2_output_0 '/blocks.9/self_attn/Constant_9_output_0 /blocks.9/self_attn/Div_output_0/blocks.9/self_attn/Div"Div p /blocks.9/self_attn/Div_output_0!/blocks.9/self_attn/Cast_output_0/blocks.9/self_attn/Cast"Cast* to u !/blocks.9/self_attn/Cast_output_0#/blocks.9/self_attn/Cast_1_output_0/blocks.9/self_attn/Cast_1"Cast* to (/blocks.9/self_attn/Constant_10_output_0/blocks.9/self_attn/Constant_10"Constant*G value*;B+/blocks.9/self_attn/Constant_10_attr::valueJ (/blocks.9/self_attn/Constant_11_output_0/blocks.9/self_attn/Constant_11"Constant*G value*;B+/blocks.9/self_attn/Constant_11_attr::valueJ (/blocks.9/self_attn/Constant_12_output_0/blocks.9/self_attn/Constant_12"Constant*G value*;B+/blocks.9/self_attn/Constant_12_attr::valueJ  #/blocks.9/self_attn/Cast_1_output_0 (/blocks.9/self_attn/Constant_12_output_0(/blocks.9/self_attn/Unsqueeze_6_output_0/blocks.9/self_attn/Unsqueeze_6" Unsqueeze (/blocks.9/self_attn/Constant_13_output_0/blocks.9/self_attn/Constant_13"Constant*G value*;B+/blocks.9/self_attn/Constant_13_attr::valueJ  */blocks.9/self_attn/q_norm/Cast_2_output_0 (/blocks.9/self_attn/Constant_11_output_0 (/blocks.9/self_attn/Unsqueeze_6_output_0 (/blocks.9/self_attn/Constant_10_output_0 (/blocks.9/self_attn/Constant_13_output_0"/blocks.9/self_attn/Slice_output_0/blocks.9/self_attn/Slice"Slice (/blocks.9/self_attn/Constant_14_output_0/blocks.9/self_attn/Constant_14"Constant*G value*;B+/blocks.9/self_attn/Constant_14_attr::valueJ (/blocks.9/self_attn/Constant_15_output_0/blocks.9/self_attn/Constant_15"Constant*G value*;B+/blocks.9/self_attn/Constant_15_attr::valueJ  #/blocks.9/self_attn/Cast_1_output_0 (/blocks.9/self_attn/Constant_15_output_0(/blocks.9/self_attn/Unsqueeze_7_output_0/blocks.9/self_attn/Unsqueeze_7" Unsqueeze (/blocks.9/self_attn/Constant_16_output_0/blocks.9/self_attn/Constant_16"Constant*G value*;B+/blocks.9/self_attn/Constant_16_attr::valueJ (/blocks.9/self_attn/Constant_17_output_0/blocks.9/self_attn/Constant_17"Constant*G value*;B+/blocks.9/self_attn/Constant_17_attr::valueJ  */blocks.9/self_attn/q_norm/Cast_2_output_0 (/blocks.9/self_attn/Unsqueeze_7_output_0 (/blocks.9/self_attn/Constant_16_output_0 (/blocks.9/self_attn/Constant_14_output_0 (/blocks.9/self_attn/Constant_17_output_0$/blocks.9/self_attn/Slice_1_output_0/blocks.9/self_attn/Slice_1"Slice f $/blocks.9/self_attn/Slice_1_output_0 /blocks.9/self_attn/Neg_output_0/blocks.9/self_attn/Neg"Neg  /blocks.9/self_attn/Neg_output_0 "/blocks.9/self_attn/Slice_output_0%/blocks.9/self_attn/Concat_3_output_0/blocks.9/self_attn/Concat_3"Concat* axis  %/blocks.9/self_attn/Concat_3_output_0 %/blocks.0/self_attn/Gather_3_output_0"/blocks.9/self_attn/Mul_1_output_0/blocks.9/self_attn/Mul_1"Mul  /blocks.9/self_attn/Mul_output_0 "/blocks.9/self_attn/Mul_1_output_0 /blocks.9/self_attn/Add_output_0/blocks.9/self_attn/Add"Add  */blocks.9/self_attn/k_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0"/blocks.9/self_attn/Mul_2_output_0/blocks.9/self_attn/Mul_2"Mul v */blocks.9/self_attn/k_norm/Cast_2_output_0$/blocks.9/self_attn/Shape_3_output_0/blocks.9/self_attn/Shape_3"Shape (/blocks.9/self_attn/Constant_18_output_0/blocks.9/self_attn/Constant_18"Constant*E value*9B+/blocks.9/self_attn/Constant_18_attr::valueJ  $/blocks.9/self_attn/Shape_3_output_0 (/blocks.9/self_attn/Constant_18_output_0%/blocks.9/self_attn/Gather_3_output_0/blocks.9/self_attn/Gather_3"Gather* axis (/blocks.9/self_attn/Constant_19_output_0/blocks.9/self_attn/Constant_19"Constant*E value*9B+/blocks.9/self_attn/Constant_19_attr::valueJ  %/blocks.9/self_attn/Gather_3_output_0 (/blocks.9/self_attn/Constant_19_output_0"/blocks.9/self_attn/Div_1_output_0/blocks.9/self_attn/Div_1"Div v "/blocks.9/self_attn/Div_1_output_0#/blocks.9/self_attn/Cast_2_output_0/blocks.9/self_attn/Cast_2"Cast* to w #/blocks.9/self_attn/Cast_2_output_0#/blocks.9/self_attn/Cast_3_output_0/blocks.9/self_attn/Cast_3"Cast* to (/blocks.9/self_attn/Constant_20_output_0/blocks.9/self_attn/Constant_20"Constant*G value*;B+/blocks.9/self_attn/Constant_20_attr::valueJ (/blocks.9/self_attn/Constant_21_output_0/blocks.9/self_attn/Constant_21"Constant*G value*;B+/blocks.9/self_attn/Constant_21_attr::valueJ (/blocks.9/self_attn/Constant_22_output_0/blocks.9/self_attn/Constant_22"Constant*G value*;B+/blocks.9/self_attn/Constant_22_attr::valueJ  #/blocks.9/self_attn/Cast_3_output_0 (/blocks.9/self_attn/Constant_22_output_0(/blocks.9/self_attn/Unsqueeze_8_output_0/blocks.9/self_attn/Unsqueeze_8" Unsqueeze (/blocks.9/self_attn/Constant_23_output_0/blocks.9/self_attn/Constant_23"Constant*G value*;B+/blocks.9/self_attn/Constant_23_attr::valueJ  */blocks.9/self_attn/k_norm/Cast_2_output_0 (/blocks.9/self_attn/Constant_21_output_0 (/blocks.9/self_attn/Unsqueeze_8_output_0 (/blocks.9/self_attn/Constant_20_output_0 (/blocks.9/self_attn/Constant_23_output_0$/blocks.9/self_attn/Slice_2_output_0/blocks.9/self_attn/Slice_2"Slice (/blocks.9/self_attn/Constant_24_output_0/blocks.9/self_attn/Constant_24"Constant*G value*;B+/blocks.9/self_attn/Constant_24_attr::valueJ (/blocks.9/self_attn/Constant_25_output_0/blocks.9/self_attn/Constant_25"Constant*G value*;B+/blocks.9/self_attn/Constant_25_attr::valueJ  #/blocks.9/self_attn/Cast_3_output_0 (/blocks.9/self_attn/Constant_25_output_0(/blocks.9/self_attn/Unsqueeze_9_output_0/blocks.9/self_attn/Unsqueeze_9" Unsqueeze (/blocks.9/self_attn/Constant_26_output_0/blocks.9/self_attn/Constant_26"Constant*G value*;B+/blocks.9/self_attn/Constant_26_attr::valueJ (/blocks.9/self_attn/Constant_27_output_0/blocks.9/self_attn/Constant_27"Constant*G value*;B+/blocks.9/self_attn/Constant_27_attr::valueJ  */blocks.9/self_attn/k_norm/Cast_2_output_0 (/blocks.9/self_attn/Unsqueeze_9_output_0 (/blocks.9/self_attn/Constant_26_output_0 (/blocks.9/self_attn/Constant_24_output_0 (/blocks.9/self_attn/Constant_27_output_0$/blocks.9/self_attn/Slice_3_output_0/blocks.9/self_attn/Slice_3"Slice j $/blocks.9/self_attn/Slice_3_output_0"/blocks.9/self_attn/Neg_1_output_0/blocks.9/self_attn/Neg_1"Neg  "/blocks.9/self_attn/Neg_1_output_0 $/blocks.9/self_attn/Slice_2_output_0%/blocks.9/self_attn/Concat_4_output_0/blocks.9/self_attn/Concat_4"Concat* axis  %/blocks.9/self_attn/Concat_4_output_0 %/blocks.0/self_attn/Gather_3_output_0"/blocks.9/self_attn/Mul_3_output_0/blocks.9/self_attn/Mul_3"Mul  "/blocks.9/self_attn/Mul_2_output_0 "/blocks.9/self_attn/Mul_3_output_0"/blocks.9/self_attn/Add_1_output_0/blocks.9/self_attn/Add_1"Add  /Gather_9_output_0 /rotary/Constant_3_output_0%/blocks.9/self_attn/Gather_4_output_0/blocks.9/self_attn/Gather_4"Gather* axis  /Gather_9_output_0 /rotary/Constant_8_output_0%/blocks.9/self_attn/Gather_5_output_0/blocks.9/self_attn/Gather_5"Gather* axis  %/blocks.9/self_attn/Gather_4_output_0 "/blocks.9/self_attn/Add_1_output_0%/blocks.9/self_attn/Concat_5_output_0/blocks.9/self_attn/Concat_5"Concat* axis  %/blocks.9/self_attn/Gather_5_output_0 &/blocks.9/self_attn/Reshape_2_output_0%/blocks.9/self_attn/Concat_6_output_0/blocks.9/self_attn/Concat_6"Concat* axis (/blocks.9/self_attn/Constant_28_output_0/blocks.9/self_attn/Constant_28"Constant*G value*;B+/blocks.9/self_attn/Constant_28_attr::valueJ  %/blocks.9/self_attn/Concat_5_output_0 (/blocks.9/self_attn/Constant_28_output_0)/blocks.9/self_attn/Unsqueeze_10_output_0 /blocks.9/self_attn/Unsqueeze_10" Unsqueeze (/blocks.9/self_attn/Constant_29_output_0/blocks.9/self_attn/Constant_29"Constant*G value*;B+/blocks.9/self_attn/Constant_29_attr::valueJ  %/blocks.9/self_attn/Concat_6_output_0 (/blocks.9/self_attn/Constant_29_output_0)/blocks.9/self_attn/Unsqueeze_11_output_0 /blocks.9/self_attn/Unsqueeze_11" Unsqueeze  )/blocks.9/self_attn/Unsqueeze_10_output_0 )/blocks.9/self_attn/Unsqueeze_11_output_0%/blocks.9/self_attn/Concat_7_output_0/blocks.9/self_attn/Concat_7"Concat* axis  /blocks.9/self_attn/Add_output_0&/blocks.9/self_attn/Transpose_output_0/blocks.9/self_attn/Transpose" Transpose* perm@@@@  %/blocks.9/self_attn/Concat_5_output_0(/blocks.9/self_attn/Transpose_1_output_0/blocks.9/self_attn/Transpose_1" Transpose* perm@@@@  %/blocks.9/self_attn/Concat_6_output_0(/blocks.9/self_attn/Transpose_2_output_0/blocks.9/self_attn/Transpose_2" Transpose* perm@@@@ t (/blocks.9/self_attn/Transpose_1_output_0$/blocks.9/self_attn/Shape_4_output_0/blocks.9/self_attn/Shape_4"Shape (/blocks.9/self_attn/Constant_30_output_0/blocks.9/self_attn/Constant_30"Constant*E value*9B+/blocks.9/self_attn/Constant_30_attr::valueJ  $/blocks.9/self_attn/Shape_4_output_0 (/blocks.9/self_attn/Constant_30_output_0%/blocks.9/self_attn/Gather_6_output_0/blocks.9/self_attn/Gather_6"Gather* axis t (/blocks.9/self_attn/Transpose_1_output_0$/blocks.9/self_attn/Shape_5_output_0/blocks.9/self_attn/Shape_5"Shape (/blocks.9/self_attn/Constant_31_output_0/blocks.9/self_attn/Constant_31"Constant*E value*9B+/blocks.9/self_attn/Constant_31_attr::valueJ  $/blocks.9/self_attn/Shape_5_output_0 (/blocks.9/self_attn/Constant_31_output_0%/blocks.9/self_attn/Gather_7_output_0/blocks.9/self_attn/Gather_7"Gather* axis t (/blocks.9/self_attn/Transpose_1_output_0$/blocks.9/self_attn/Shape_6_output_0/blocks.9/self_attn/Shape_6"Shape (/blocks.9/self_attn/Constant_32_output_0/blocks.9/self_attn/Constant_32"Constant*E value*9B+/blocks.9/self_attn/Constant_32_attr::valueJ  $/blocks.9/self_attn/Shape_6_output_0 (/blocks.9/self_attn/Constant_32_output_0%/blocks.9/self_attn/Gather_8_output_0/blocks.9/self_attn/Gather_8"Gather* axis t (/blocks.9/self_attn/Transpose_1_output_0$/blocks.9/self_attn/Shape_7_output_0/blocks.9/self_attn/Shape_7"Shape (/blocks.9/self_attn/Constant_33_output_0/blocks.9/self_attn/Constant_33"Constant*E value*9B+/blocks.9/self_attn/Constant_33_attr::valueJ  $/blocks.9/self_attn/Shape_7_output_0 (/blocks.9/self_attn/Constant_33_output_0%/blocks.9/self_attn/Gather_9_output_0/blocks.9/self_attn/Gather_9"Gather* axis (/blocks.9/self_attn/Constant_34_output_0/blocks.9/self_attn/Constant_34"Constant*G value*;B+/blocks.9/self_attn/Constant_34_attr::valueJ  (/blocks.9/self_attn/Transpose_1_output_0 (/blocks.9/self_attn/Constant_34_output_0)/blocks.9/self_attn/Unsqueeze_12_output_0 /blocks.9/self_attn/Unsqueeze_12" Unsqueeze (/blocks.9/self_attn/Constant_35_output_0/blocks.9/self_attn/Constant_35"Constant*G value*;B+/blocks.9/self_attn/Constant_35_attr::valueJ  %/blocks.9/self_attn/Gather_6_output_0 (/blocks.9/self_attn/Constant_35_output_0)/blocks.9/self_attn/Unsqueeze_13_output_0 /blocks.9/self_attn/Unsqueeze_13" Unsqueeze (/blocks.9/self_attn/Constant_36_output_0/blocks.9/self_attn/Constant_36"Constant*G value*;B+/blocks.9/self_attn/Constant_36_attr::valueJ  %/blocks.9/self_attn/Gather_7_output_0 (/blocks.9/self_attn/Constant_36_output_0)/blocks.9/self_attn/Unsqueeze_14_output_0 /blocks.9/self_attn/Unsqueeze_14" Unsqueeze (/blocks.9/self_attn/Constant_37_output_0/blocks.9/self_attn/Constant_37"Constant*G value*;B+/blocks.9/self_attn/Constant_37_attr::valueJ (/blocks.9/self_attn/Constant_38_output_0/blocks.9/self_attn/Constant_38"Constant*G value*;B+/blocks.9/self_attn/Constant_38_attr::valueJ  %/blocks.9/self_attn/Gather_8_output_0 (/blocks.9/self_attn/Constant_38_output_0)/blocks.9/self_attn/Unsqueeze_15_output_0 /blocks.9/self_attn/Unsqueeze_15" Unsqueeze (/blocks.9/self_attn/Constant_39_output_0/blocks.9/self_attn/Constant_39"Constant*G value*;B+/blocks.9/self_attn/Constant_39_attr::valueJ  %/blocks.9/self_attn/Gather_9_output_0 (/blocks.9/self_attn/Constant_39_output_0)/blocks.9/self_attn/Unsqueeze_16_output_0 /blocks.9/self_attn/Unsqueeze_16" Unsqueeze  )/blocks.9/self_attn/Unsqueeze_13_output_0 )/blocks.9/self_attn/Unsqueeze_14_output_0 (/blocks.9/self_attn/Constant_37_output_0 )/blocks.9/self_attn/Unsqueeze_15_output_0 )/blocks.9/self_attn/Unsqueeze_16_output_0%/blocks.9/self_attn/Concat_8_output_0/blocks.9/self_attn/Concat_8"Concat* axis (/blocks.9/self_attn/Constant_40_output_0/blocks.9/self_attn/Constant_40"Constant*G value*;B+/blocks.9/self_attn/Constant_40_attr::valueJ  %/blocks.9/self_attn/Concat_8_output_0 (/blocks.9/self_attn/Constant_40_output_0&/blocks.9/self_attn/Reshape_3_output_0/blocks.9/self_attn/Reshape_3"Reshape* allowzero r &/blocks.9/self_attn/Reshape_3_output_0$/blocks.9/self_attn/Shape_8_output_0/blocks.9/self_attn/Shape_8"Shape  $/blocks.9/self_attn/Shape_8_output_0,/blocks.9/self_attn/ConstantOfShape_output_0#/blocks.9/self_attn/ConstantOfShape"ConstantOfShape*K value*?B//blocks.9/self_attn/ConstantOfShape_attr::valueJ (/blocks.9/self_attn/Constant_41_output_0/blocks.9/self_attn/Constant_41"Constant*E value*9B+/blocks.9/self_attn/Constant_41_attr::valueJ  ,/blocks.9/self_attn/ConstantOfShape_output_0 (/blocks.9/self_attn/Constant_41_output_0"/blocks.9/self_attn/Mul_4_output_0/blocks.9/self_attn/Mul_4"Mul  &/blocks.9/self_attn/Reshape_3_output_0 "/blocks.9/self_attn/Mul_4_output_0"/blocks.9/self_attn/Equal_output_0/blocks.9/self_attn/Equal"Equal  "/blocks.9/self_attn/Equal_output_0 ,/blocks.9/self_attn/ConstantOfShape_output_0 &/blocks.9/self_attn/Reshape_3_output_0"/blocks.9/self_attn/Where_output_0/blocks.9/self_attn/Where"Where  )/blocks.9/self_attn/Unsqueeze_12_output_0 "/blocks.9/self_attn/Where_output_0#/blocks.9/self_attn/Expand_output_0/blocks.9/self_attn/Expand"Expand (/blocks.9/self_attn/Constant_42_output_0/blocks.9/self_attn/Constant_42"Constant*E value*9B+/blocks.9/self_attn/Constant_42_attr::valueJ  %/blocks.9/self_attn/Gather_7_output_0 (/blocks.9/self_attn/Constant_42_output_0"/blocks.9/self_attn/Mul_5_output_0/blocks.9/self_attn/Mul_5"Mul fonnx::Unsqueeze_3151 Constant_5062"Constant*5 value*)BConstant_5062_attr::valueJ  %/blocks.9/self_attn/Gather_6_output_0 onnx::Unsqueeze_3151)/blocks.9/self_attn/Unsqueeze_17_output_0 /blocks.9/self_attn/Unsqueeze_17" Unsqueeze fonnx::Unsqueeze_3153 Constant_5064"Constant*5 value*)BConstant_5064_attr::valueJ  "/blocks.9/self_attn/Mul_5_output_0 onnx::Unsqueeze_3153)/blocks.9/self_attn/Unsqueeze_18_output_0 /blocks.9/self_attn/Unsqueeze_18" Unsqueeze fonnx::Unsqueeze_3155 Constant_5066"Constant*5 value*)BConstant_5066_attr::valueJ  %/blocks.9/self_attn/Gather_8_output_0 onnx::Unsqueeze_3155)/blocks.9/self_attn/Unsqueeze_19_output_0 /blocks.9/self_attn/Unsqueeze_19" Unsqueeze fonnx::Unsqueeze_3157 Constant_5068"Constant*5 value*)BConstant_5068_attr::valueJ  %/blocks.9/self_attn/Gather_9_output_0 onnx::Unsqueeze_3157)/blocks.9/self_attn/Unsqueeze_20_output_0 /blocks.9/self_attn/Unsqueeze_20" Unsqueeze  )/blocks.9/self_attn/Unsqueeze_17_output_0 )/blocks.9/self_attn/Unsqueeze_18_output_0 )/blocks.9/self_attn/Unsqueeze_19_output_0 )/blocks.9/self_attn/Unsqueeze_20_output_0%/blocks.9/self_attn/Concat_9_output_0/blocks.9/self_attn/Concat_9"Concat* axis  #/blocks.9/self_attn/Expand_output_0 %/blocks.9/self_attn/Concat_9_output_0&/blocks.9/self_attn/Reshape_4_output_0/blocks.9/self_attn/Reshape_4"Reshape* allowzero t (/blocks.9/self_attn/Transpose_2_output_0$/blocks.9/self_attn/Shape_9_output_0/blocks.9/self_attn/Shape_9"Shape (/blocks.9/self_attn/Constant_43_output_0/blocks.9/self_attn/Constant_43"Constant*E value*9B+/blocks.9/self_attn/Constant_43_attr::valueJ  $/blocks.9/self_attn/Shape_9_output_0 (/blocks.9/self_attn/Constant_43_output_0&/blocks.9/self_attn/Gather_10_output_0/blocks.9/self_attn/Gather_10"Gather* axis v (/blocks.9/self_attn/Transpose_2_output_0%/blocks.9/self_attn/Shape_10_output_0/blocks.9/self_attn/Shape_10"Shape (/blocks.9/self_attn/Constant_44_output_0/blocks.9/self_attn/Constant_44"Constant*E value*9B+/blocks.9/self_attn/Constant_44_attr::valueJ  %/blocks.9/self_attn/Shape_10_output_0 (/blocks.9/self_attn/Constant_44_output_0&/blocks.9/self_attn/Gather_11_output_0/blocks.9/self_attn/Gather_11"Gather* axis v (/blocks.9/self_attn/Transpose_2_output_0%/blocks.9/self_attn/Shape_11_output_0/blocks.9/self_attn/Shape_11"Shape (/blocks.9/self_attn/Constant_45_output_0/blocks.9/self_attn/Constant_45"Constant*E value*9B+/blocks.9/self_attn/Constant_45_attr::valueJ  %/blocks.9/self_attn/Shape_11_output_0 (/blocks.9/self_attn/Constant_45_output_0&/blocks.9/self_attn/Gather_12_output_0/blocks.9/self_attn/Gather_12"Gather* axis v (/blocks.9/self_attn/Transpose_2_output_0%/blocks.9/self_attn/Shape_12_output_0/blocks.9/self_attn/Shape_12"Shape (/blocks.9/self_attn/Constant_46_output_0/blocks.9/self_attn/Constant_46"Constant*E value*9B+/blocks.9/self_attn/Constant_46_attr::valueJ  %/blocks.9/self_attn/Shape_12_output_0 (/blocks.9/self_attn/Constant_46_output_0&/blocks.9/self_attn/Gather_13_output_0/blocks.9/self_attn/Gather_13"Gather* axis (/blocks.9/self_attn/Constant_47_output_0/blocks.9/self_attn/Constant_47"Constant*G value*;B+/blocks.9/self_attn/Constant_47_attr::valueJ  (/blocks.9/self_attn/Transpose_2_output_0 (/blocks.9/self_attn/Constant_47_output_0)/blocks.9/self_attn/Unsqueeze_21_output_0 /blocks.9/self_attn/Unsqueeze_21" Unsqueeze (/blocks.9/self_attn/Constant_48_output_0/blocks.9/self_attn/Constant_48"Constant*G value*;B+/blocks.9/self_attn/Constant_48_attr::valueJ  &/blocks.9/self_attn/Gather_10_output_0 (/blocks.9/self_attn/Constant_48_output_0)/blocks.9/self_attn/Unsqueeze_22_output_0 /blocks.9/self_attn/Unsqueeze_22" Unsqueeze (/blocks.9/self_attn/Constant_49_output_0/blocks.9/self_attn/Constant_49"Constant*G value*;B+/blocks.9/self_attn/Constant_49_attr::valueJ  &/blocks.9/self_attn/Gather_11_output_0 (/blocks.9/self_attn/Constant_49_output_0)/blocks.9/self_attn/Unsqueeze_23_output_0 /blocks.9/self_attn/Unsqueeze_23" Unsqueeze (/blocks.9/self_attn/Constant_50_output_0/blocks.9/self_attn/Constant_50"Constant*G value*;B+/blocks.9/self_attn/Constant_50_attr::valueJ (/blocks.9/self_attn/Constant_51_output_0/blocks.9/self_attn/Constant_51"Constant*G value*;B+/blocks.9/self_attn/Constant_51_attr::valueJ  &/blocks.9/self_attn/Gather_12_output_0 (/blocks.9/self_attn/Constant_51_output_0)/blocks.9/self_attn/Unsqueeze_24_output_0 /blocks.9/self_attn/Unsqueeze_24" Unsqueeze (/blocks.9/self_attn/Constant_52_output_0/blocks.9/self_attn/Constant_52"Constant*G value*;B+/blocks.9/self_attn/Constant_52_attr::valueJ  &/blocks.9/self_attn/Gather_13_output_0 (/blocks.9/self_attn/Constant_52_output_0)/blocks.9/self_attn/Unsqueeze_25_output_0 /blocks.9/self_attn/Unsqueeze_25" Unsqueeze  )/blocks.9/self_attn/Unsqueeze_22_output_0 )/blocks.9/self_attn/Unsqueeze_23_output_0 (/blocks.9/self_attn/Constant_50_output_0 )/blocks.9/self_attn/Unsqueeze_24_output_0 )/blocks.9/self_attn/Unsqueeze_25_output_0&/blocks.9/self_attn/Concat_10_output_0/blocks.9/self_attn/Concat_10"Concat* axis (/blocks.9/self_attn/Constant_53_output_0/blocks.9/self_attn/Constant_53"Constant*G value*;B+/blocks.9/self_attn/Constant_53_attr::valueJ  &/blocks.9/self_attn/Concat_10_output_0 (/blocks.9/self_attn/Constant_53_output_0&/blocks.9/self_attn/Reshape_5_output_0/blocks.9/self_attn/Reshape_5"Reshape* allowzero t &/blocks.9/self_attn/Reshape_5_output_0%/blocks.9/self_attn/Shape_13_output_0/blocks.9/self_attn/Shape_13"Shape  %/blocks.9/self_attn/Shape_13_output_0./blocks.9/self_attn/ConstantOfShape_1_output_0%/blocks.9/self_attn/ConstantOfShape_1"ConstantOfShape*M value*AB1/blocks.9/self_attn/ConstantOfShape_1_attr::valueJ (/blocks.9/self_attn/Constant_54_output_0/blocks.9/self_attn/Constant_54"Constant*E value*9B+/blocks.9/self_attn/Constant_54_attr::valueJ  ./blocks.9/self_attn/ConstantOfShape_1_output_0 (/blocks.9/self_attn/Constant_54_output_0"/blocks.9/self_attn/Mul_6_output_0/blocks.9/self_attn/Mul_6"Mul  &/blocks.9/self_attn/Reshape_5_output_0 "/blocks.9/self_attn/Mul_6_output_0$/blocks.9/self_attn/Equal_1_output_0/blocks.9/self_attn/Equal_1"Equal  $/blocks.9/self_attn/Equal_1_output_0 ./blocks.9/self_attn/ConstantOfShape_1_output_0 &/blocks.9/self_attn/Reshape_5_output_0$/blocks.9/self_attn/Where_1_output_0/blocks.9/self_attn/Where_1"Where  )/blocks.9/self_attn/Unsqueeze_21_output_0 $/blocks.9/self_attn/Where_1_output_0%/blocks.9/self_attn/Expand_1_output_0/blocks.9/self_attn/Expand_1"Expand (/blocks.9/self_attn/Constant_55_output_0/blocks.9/self_attn/Constant_55"Constant*E value*9B+/blocks.9/self_attn/Constant_55_attr::valueJ  &/blocks.9/self_attn/Gather_11_output_0 (/blocks.9/self_attn/Constant_55_output_0"/blocks.9/self_attn/Mul_7_output_0/blocks.9/self_attn/Mul_7"Mul fonnx::Unsqueeze_3197 Constant_5107"Constant*5 value*)BConstant_5107_attr::valueJ  &/blocks.9/self_attn/Gather_10_output_0 onnx::Unsqueeze_3197)/blocks.9/self_attn/Unsqueeze_26_output_0 /blocks.9/self_attn/Unsqueeze_26" Unsqueeze fonnx::Unsqueeze_3199 Constant_5109"Constant*5 value*)BConstant_5109_attr::valueJ  "/blocks.9/self_attn/Mul_7_output_0 onnx::Unsqueeze_3199)/blocks.9/self_attn/Unsqueeze_27_output_0 /blocks.9/self_attn/Unsqueeze_27" Unsqueeze fonnx::Unsqueeze_3201 Constant_5111"Constant*5 value*)BConstant_5111_attr::valueJ  &/blocks.9/self_attn/Gather_12_output_0 onnx::Unsqueeze_3201)/blocks.9/self_attn/Unsqueeze_28_output_0 /blocks.9/self_attn/Unsqueeze_28" Unsqueeze fonnx::Unsqueeze_3203 Constant_5113"Constant*5 value*)BConstant_5113_attr::valueJ  &/blocks.9/self_attn/Gather_13_output_0 onnx::Unsqueeze_3203)/blocks.9/self_attn/Unsqueeze_29_output_0 /blocks.9/self_attn/Unsqueeze_29" Unsqueeze  )/blocks.9/self_attn/Unsqueeze_26_output_0 )/blocks.9/self_attn/Unsqueeze_27_output_0 )/blocks.9/self_attn/Unsqueeze_28_output_0 )/blocks.9/self_attn/Unsqueeze_29_output_0&/blocks.9/self_attn/Concat_11_output_0/blocks.9/self_attn/Concat_11"Concat* axis  %/blocks.9/self_attn/Expand_1_output_0 &/blocks.9/self_attn/Concat_11_output_0&/blocks.9/self_attn/Reshape_6_output_0/blocks.9/self_attn/Reshape_6"Reshape* allowzero  &/blocks.9/self_attn/Transpose_output_0 &/blocks.9/self_attn/Reshape_4_output_0#/blocks.9/self_attn/MatMul_output_0/blocks.9/self_attn/MatMul"MatMul (/blocks.9/self_attn/Constant_56_output_0/blocks.9/self_attn/Constant_56"Constant*A value*5B+/blocks.9/self_attn/Constant_56_attr::valueJ5A  #/blocks.9/self_attn/MatMul_output_0 (/blocks.9/self_attn/Constant_56_output_0"/blocks.9/self_attn/Div_2_output_0/blocks.9/self_attn/Div_2"Div x "/blocks.9/self_attn/Div_2_output_0 attention_mask"/blocks.9/self_attn/Add_2_output_0/blocks.9/self_attn/Add_2"Add  "/blocks.9/self_attn/Add_2_output_0$/blocks.9/self_attn/Softmax_output_0/blocks.9/self_attn/Softmax"Softmax* axis x $/blocks.9/self_attn/Softmax_output_0#/blocks.9/self_attn/Cast_4_output_0/blocks.9/self_attn/Cast_4"Cast* to  #/blocks.9/self_attn/Cast_4_output_0 &/blocks.9/self_attn/Reshape_6_output_0%/blocks.9/self_attn/MatMul_1_output_0/blocks.9/self_attn/MatMul_1"MatMul  %/blocks.9/self_attn/MatMul_1_output_0(/blocks.9/self_attn/Transpose_3_output_0/blocks.9/self_attn/Transpose_3" Transpose* perm@@@@ fonnx::Unsqueeze_3215 Constant_5125"Constant*5 value*)BConstant_5125_attr::valueJ  #/blocks.9/self_attn/Gather_output_0 onnx::Unsqueeze_3215)/blocks.9/self_attn/Unsqueeze_30_output_0 /blocks.9/self_attn/Unsqueeze_30" Unsqueeze fonnx::Unsqueeze_3217 Constant_5127"Constant*5 value*)BConstant_5127_attr::valueJ  %/blocks.9/self_attn/Gather_1_output_0 onnx::Unsqueeze_3217)/blocks.9/self_attn/Unsqueeze_31_output_0 /blocks.9/self_attn/Unsqueeze_31" Unsqueeze (/blocks.9/self_attn/Constant_57_output_0/blocks.9/self_attn/Constant_57"Constant*G value*;B+/blocks.9/self_attn/Constant_57_attr::valueJ  )/blocks.9/self_attn/Unsqueeze_30_output_0 )/blocks.9/self_attn/Unsqueeze_31_output_0 (/blocks.9/self_attn/Constant_57_output_0&/blocks.9/self_attn/Concat_12_output_0/blocks.9/self_attn/Concat_12"Concat* axis  (/blocks.9/self_attn/Transpose_3_output_0 &/blocks.9/self_attn/Concat_12_output_0&/blocks.9/self_attn/Reshape_7_output_0/blocks.9/self_attn/Reshape_7"Reshape* allowzero  &/blocks.9/self_attn/Reshape_7_output_0 onnx::MatMul_8841*/blocks.9/self_attn/o_proj/MatMul_output_0!/blocks.9/self_attn/o_proj/MatMul"MatMul  )/blocks.9/input_layernorm/Cast_1_output_0 */blocks.9/self_attn/o_proj/MatMul_output_0/blocks.9/Add_output_0 /blocks.9/Add"Add  /blocks.9/Add_output_00/blocks.9/post_attention_layernorm/Cast_output_0'/blocks.9/post_attention_layernorm/Cast"Cast* to 4/blocks.9/post_attention_layernorm/Constant_output_0+/blocks.9/post_attention_layernorm/Constant"Constant*M value*AB7/blocks.9/post_attention_layernorm/Constant_attr::valueJ@  0/blocks.9/post_attention_layernorm/Cast_output_0 4/blocks.9/post_attention_layernorm/Constant_output_0//blocks.9/post_attention_layernorm/Pow_output_0&/blocks.9/post_attention_layernorm/Pow"Pow  //blocks.9/post_attention_layernorm/Pow_output_06/blocks.9/post_attention_layernorm/ReduceMean_output_0-/blocks.9/post_attention_layernorm/ReduceMean" ReduceMean* axes@* keepdims 6/blocks.9/post_attention_layernorm/Constant_1_output_0-/blocks.9/post_attention_layernorm/Constant_1"Constant*O value*CB9/blocks.9/post_attention_layernorm/Constant_1_attr::valueJ75  6/blocks.9/post_attention_layernorm/ReduceMean_output_0 6/blocks.9/post_attention_layernorm/Constant_1_output_0//blocks.9/post_attention_layernorm/Add_output_0&/blocks.9/post_attention_layernorm/Add"Add  //blocks.9/post_attention_layernorm/Add_output_00/blocks.9/post_attention_layernorm/Sqrt_output_0'/blocks.9/post_attention_layernorm/Sqrt"Sqrt 6/blocks.9/post_attention_layernorm/Constant_2_output_0-/blocks.9/post_attention_layernorm/Constant_2"Constant*O value*CB9/blocks.9/post_attention_layernorm/Constant_2_attr::valueJ?  6/blocks.9/post_attention_layernorm/Constant_2_output_0 0/blocks.9/post_attention_layernorm/Sqrt_output_0//blocks.9/post_attention_layernorm/Div_output_0&/blocks.9/post_attention_layernorm/Div"Div  0/blocks.9/post_attention_layernorm/Cast_output_02/blocks.9/post_attention_layernorm/Cast_1_output_0)/blocks.9/post_attention_layernorm/Cast_1"Cast* to  2/blocks.9/post_attention_layernorm/Cast_1_output_0 //blocks.9/post_attention_layernorm/Div_output_0//blocks.9/post_attention_layernorm/Mul_output_0&/blocks.9/post_attention_layernorm/Mul"Mul  //blocks.9/post_attention_layernorm/Mul_output_0 (blocks.9.post_attention_layernorm.weight1/blocks.9/post_attention_layernorm/Mul_1_output_0(/blocks.9/post_attention_layernorm/Mul_1"Mul  1/blocks.9/post_attention_layernorm/Mul_1_output_02/blocks.9/post_attention_layernorm/Cast_2_output_0)/blocks.9/post_attention_layernorm/Cast_2"Cast* to  2/blocks.9/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_8842'/blocks.9/mlp/gate_proj/MatMul_output_0/blocks.9/mlp/gate_proj/MatMul"MatMul w '/blocks.9/mlp/gate_proj/MatMul_output_0%/blocks.9/mlp/act_fn/Sigmoid_output_0/blocks.9/mlp/act_fn/Sigmoid"Sigmoid  '/blocks.9/mlp/gate_proj/MatMul_output_0 %/blocks.9/mlp/act_fn/Sigmoid_output_0!/blocks.9/mlp/act_fn/Mul_output_0/blocks.9/mlp/act_fn/Mul"Mul  2/blocks.9/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_8843%/blocks.9/mlp/up_proj/MatMul_output_0/blocks.9/mlp/up_proj/MatMul"MatMul ~ !/blocks.9/mlp/act_fn/Mul_output_0 %/blocks.9/mlp/up_proj/MatMul_output_0/blocks.9/mlp/Mul_output_0/blocks.9/mlp/Mul"Mul  /blocks.9/mlp/Mul_output_0 onnx::MatMul_8844'/blocks.9/mlp/down_proj/MatMul_output_0/blocks.9/mlp/down_proj/MatMul"MatMul  2/blocks.9/post_attention_layernorm/Cast_1_output_0 '/blocks.9/mlp/down_proj/MatMul_output_0/blocks.9/Add_1_output_0/blocks.9/Add_1"Add `/Constant_3_output_0 /Constant_3"Constant*1 value*%B/Constant_3_attr::valueJ  ] past_key_values /Constant_3_output_0/Gather_10_output_0 /Gather_10"Gather* axis /blocks.10/Constant_output_0/blocks.10/Constant"Constant*K value*?B/blocks.10/Constant_attr::valueJ  /blocks.9/Add_1_output_0 /blocks.10/Constant_output_0/blocks.10/Reshape_output_0/blocks.10/Reshape"Reshape* allowzero y /blocks.10/Reshape_output_0(/blocks.10/input_layernorm/Cast_output_0/blocks.10/input_layernorm/Cast"Cast* to ,/blocks.10/input_layernorm/Constant_output_0#/blocks.10/input_layernorm/Constant"Constant*E value*9B//blocks.10/input_layernorm/Constant_attr::valueJ@  (/blocks.10/input_layernorm/Cast_output_0 ,/blocks.10/input_layernorm/Constant_output_0'/blocks.10/input_layernorm/Pow_output_0/blocks.10/input_layernorm/Pow"Pow  '/blocks.10/input_layernorm/Pow_output_0./blocks.10/input_layernorm/ReduceMean_output_0%/blocks.10/input_layernorm/ReduceMean" ReduceMean* axes@* keepdims ./blocks.10/input_layernorm/Constant_1_output_0%/blocks.10/input_layernorm/Constant_1"Constant*G value*;B1/blocks.10/input_layernorm/Constant_1_attr::valueJ75  ./blocks.10/input_layernorm/ReduceMean_output_0 ./blocks.10/input_layernorm/Constant_1_output_0'/blocks.10/input_layernorm/Add_output_0/blocks.10/input_layernorm/Add"Add z '/blocks.10/input_layernorm/Add_output_0(/blocks.10/input_layernorm/Sqrt_output_0/blocks.10/input_layernorm/Sqrt"Sqrt ./blocks.10/input_layernorm/Constant_2_output_0%/blocks.10/input_layernorm/Constant_2"Constant*G value*;B1/blocks.10/input_layernorm/Constant_2_attr::valueJ?  ./blocks.10/input_layernorm/Constant_2_output_0 (/blocks.10/input_layernorm/Sqrt_output_0'/blocks.10/input_layernorm/Div_output_0/blocks.10/input_layernorm/Div"Div  (/blocks.10/input_layernorm/Cast_output_0*/blocks.10/input_layernorm/Cast_1_output_0!/blocks.10/input_layernorm/Cast_1"Cast* to  */blocks.10/input_layernorm/Cast_1_output_0 '/blocks.10/input_layernorm/Div_output_0'/blocks.10/input_layernorm/Mul_output_0/blocks.10/input_layernorm/Mul"Mul  '/blocks.10/input_layernorm/Mul_output_0 blocks.10.input_layernorm.weight)/blocks.10/input_layernorm/Mul_1_output_0 /blocks.10/input_layernorm/Mul_1"Mul  )/blocks.10/input_layernorm/Mul_1_output_0*/blocks.10/input_layernorm/Cast_2_output_0!/blocks.10/input_layernorm/Cast_2"Cast* to t */blocks.10/input_layernorm/Cast_2_output_0#/blocks.10/self_attn/Shape_output_0/blocks.10/self_attn/Shape"Shape &/blocks.10/self_attn/Constant_output_0/blocks.10/self_attn/Constant"Constant*C value*7B)/blocks.10/self_attn/Constant_attr::valueJ  #/blocks.10/self_attn/Shape_output_0 &/blocks.10/self_attn/Constant_output_0$/blocks.10/self_attn/Gather_output_0/blocks.10/self_attn/Gather"Gather* axis x */blocks.10/input_layernorm/Cast_2_output_0%/blocks.10/self_attn/Shape_1_output_0/blocks.10/self_attn/Shape_1"Shape (/blocks.10/self_attn/Constant_1_output_0/blocks.10/self_attn/Constant_1"Constant*E value*9B+/blocks.10/self_attn/Constant_1_attr::valueJ  %/blocks.10/self_attn/Shape_1_output_0 (/blocks.10/self_attn/Constant_1_output_0&/blocks.10/self_attn/Gather_1_output_0/blocks.10/self_attn/Gather_1"Gather* axis  */blocks.10/input_layernorm/Cast_2_output_0 onnx::MatMul_8845+/blocks.10/self_attn/q_proj/MatMul_output_0"/blocks.10/self_attn/q_proj/MatMul"MatMul  */blocks.10/input_layernorm/Cast_2_output_0 onnx::MatMul_8846+/blocks.10/self_attn/k_proj/MatMul_output_0"/blocks.10/self_attn/k_proj/MatMul"MatMul  */blocks.10/input_layernorm/Cast_2_output_0 onnx::MatMul_8847+/blocks.10/self_attn/v_proj/MatMul_output_0"/blocks.10/self_attn/v_proj/MatMul"MatMul fonnx::Unsqueeze_3278 Constant_5180"Constant*5 value*)BConstant_5180_attr::valueJ  $/blocks.10/self_attn/Gather_output_0 onnx::Unsqueeze_3278'/blocks.10/self_attn/Unsqueeze_output_0/blocks.10/self_attn/Unsqueeze" Unsqueeze fonnx::Unsqueeze_3280 Constant_5182"Constant*5 value*)BConstant_5182_attr::valueJ  &/blocks.10/self_attn/Gather_1_output_0 onnx::Unsqueeze_3280)/blocks.10/self_attn/Unsqueeze_1_output_0 /blocks.10/self_attn/Unsqueeze_1" Unsqueeze (/blocks.10/self_attn/Constant_2_output_0/blocks.10/self_attn/Constant_2"Constant*G value*;B+/blocks.10/self_attn/Constant_2_attr::valueJ (/blocks.10/self_attn/Constant_3_output_0/blocks.10/self_attn/Constant_3"Constant*G value*;B+/blocks.10/self_attn/Constant_3_attr::valueJ  '/blocks.10/self_attn/Unsqueeze_output_0 )/blocks.10/self_attn/Unsqueeze_1_output_0 (/blocks.10/self_attn/Constant_2_output_0 (/blocks.10/self_attn/Constant_3_output_0$/blocks.10/self_attn/Concat_output_0/blocks.10/self_attn/Concat"Concat* axis  +/blocks.10/self_attn/q_proj/MatMul_output_0 $/blocks.10/self_attn/Concat_output_0%/blocks.10/self_attn/Reshape_output_0/blocks.10/self_attn/Reshape"Reshape* allowzero fonnx::Unsqueeze_3288 Constant_5188"Constant*5 value*)BConstant_5188_attr::valueJ  $/blocks.10/self_attn/Gather_output_0 onnx::Unsqueeze_3288)/blocks.10/self_attn/Unsqueeze_2_output_0 /blocks.10/self_attn/Unsqueeze_2" Unsqueeze fonnx::Unsqueeze_3290 Constant_5190"Constant*5 value*)BConstant_5190_attr::valueJ  &/blocks.10/self_attn/Gather_1_output_0 onnx::Unsqueeze_3290)/blocks.10/self_attn/Unsqueeze_3_output_0 /blocks.10/self_attn/Unsqueeze_3" Unsqueeze (/blocks.10/self_attn/Constant_4_output_0/blocks.10/self_attn/Constant_4"Constant*G value*;B+/blocks.10/self_attn/Constant_4_attr::valueJ (/blocks.10/self_attn/Constant_5_output_0/blocks.10/self_attn/Constant_5"Constant*G value*;B+/blocks.10/self_attn/Constant_5_attr::valueJ  )/blocks.10/self_attn/Unsqueeze_2_output_0 )/blocks.10/self_attn/Unsqueeze_3_output_0 (/blocks.10/self_attn/Constant_4_output_0 (/blocks.10/self_attn/Constant_5_output_0&/blocks.10/self_attn/Concat_1_output_0/blocks.10/self_attn/Concat_1"Concat* axis fonnx::Unsqueeze_3297 Constant_5195"Constant*5 value*)BConstant_5195_attr::valueJ  $/blocks.10/self_attn/Gather_output_0 onnx::Unsqueeze_3297)/blocks.10/self_attn/Unsqueeze_4_output_0 /blocks.10/self_attn/Unsqueeze_4" Unsqueeze fonnx::Unsqueeze_3299 Constant_5197"Constant*5 value*)BConstant_5197_attr::valueJ  &/blocks.10/self_attn/Gather_1_output_0 onnx::Unsqueeze_3299)/blocks.10/self_attn/Unsqueeze_5_output_0 /blocks.10/self_attn/Unsqueeze_5" Unsqueeze (/blocks.10/self_attn/Constant_6_output_0/blocks.10/self_attn/Constant_6"Constant*G value*;B+/blocks.10/self_attn/Constant_6_attr::valueJ (/blocks.10/self_attn/Constant_7_output_0/blocks.10/self_attn/Constant_7"Constant*G value*;B+/blocks.10/self_attn/Constant_7_attr::valueJ  )/blocks.10/self_attn/Unsqueeze_4_output_0 )/blocks.10/self_attn/Unsqueeze_5_output_0 (/blocks.10/self_attn/Constant_6_output_0 (/blocks.10/self_attn/Constant_7_output_0&/blocks.10/self_attn/Concat_2_output_0/blocks.10/self_attn/Concat_2"Concat* axis  +/blocks.10/self_attn/k_proj/MatMul_output_0 &/blocks.10/self_attn/Concat_1_output_0'/blocks.10/self_attn/Reshape_1_output_0/blocks.10/self_attn/Reshape_1"Reshape* allowzero  +/blocks.10/self_attn/v_proj/MatMul_output_0 &/blocks.10/self_attn/Concat_2_output_0'/blocks.10/self_attn/Reshape_2_output_0/blocks.10/self_attn/Reshape_2"Reshape* allowzero  %/blocks.10/self_attn/Reshape_output_0)/blocks.10/self_attn/q_norm/Cast_output_0 /blocks.10/self_attn/q_norm/Cast"Cast* to -/blocks.10/self_attn/q_norm/Constant_output_0$/blocks.10/self_attn/q_norm/Constant"Constant*F value*:B0/blocks.10/self_attn/q_norm/Constant_attr::valueJ@  )/blocks.10/self_attn/q_norm/Cast_output_0 -/blocks.10/self_attn/q_norm/Constant_output_0(/blocks.10/self_attn/q_norm/Pow_output_0/blocks.10/self_attn/q_norm/Pow"Pow  (/blocks.10/self_attn/q_norm/Pow_output_0//blocks.10/self_attn/q_norm/ReduceMean_output_0&/blocks.10/self_attn/q_norm/ReduceMean" ReduceMean* axes@* keepdims //blocks.10/self_attn/q_norm/Constant_1_output_0&/blocks.10/self_attn/q_norm/Constant_1"Constant*H value*<B2/blocks.10/self_attn/q_norm/Constant_1_attr::valueJ75  //blocks.10/self_attn/q_norm/ReduceMean_output_0 //blocks.10/self_attn/q_norm/Constant_1_output_0(/blocks.10/self_attn/q_norm/Add_output_0/blocks.10/self_attn/q_norm/Add"Add } (/blocks.10/self_attn/q_norm/Add_output_0)/blocks.10/self_attn/q_norm/Sqrt_output_0 /blocks.10/self_attn/q_norm/Sqrt"Sqrt //blocks.10/self_attn/q_norm/Constant_2_output_0&/blocks.10/self_attn/q_norm/Constant_2"Constant*H value*<B2/blocks.10/self_attn/q_norm/Constant_2_attr::valueJ?  //blocks.10/self_attn/q_norm/Constant_2_output_0 )/blocks.10/self_attn/q_norm/Sqrt_output_0(/blocks.10/self_attn/q_norm/Div_output_0/blocks.10/self_attn/q_norm/Div"Div  )/blocks.10/self_attn/q_norm/Cast_output_0+/blocks.10/self_attn/q_norm/Cast_1_output_0"/blocks.10/self_attn/q_norm/Cast_1"Cast* to  +/blocks.10/self_attn/q_norm/Cast_1_output_0 (/blocks.10/self_attn/q_norm/Div_output_0(/blocks.10/self_attn/q_norm/Mul_output_0/blocks.10/self_attn/q_norm/Mul"Mul  (/blocks.10/self_attn/q_norm/Mul_output_0 !blocks.10.self_attn.q_norm.weight*/blocks.10/self_attn/q_norm/Mul_1_output_0!/blocks.10/self_attn/q_norm/Mul_1"Mul  */blocks.10/self_attn/q_norm/Mul_1_output_0+/blocks.10/self_attn/q_norm/Cast_2_output_0"/blocks.10/self_attn/q_norm/Cast_2"Cast* to  '/blocks.10/self_attn/Reshape_1_output_0)/blocks.10/self_attn/k_norm/Cast_output_0 /blocks.10/self_attn/k_norm/Cast"Cast* to -/blocks.10/self_attn/k_norm/Constant_output_0$/blocks.10/self_attn/k_norm/Constant"Constant*F value*:B0/blocks.10/self_attn/k_norm/Constant_attr::valueJ@  )/blocks.10/self_attn/k_norm/Cast_output_0 -/blocks.10/self_attn/k_norm/Constant_output_0(/blocks.10/self_attn/k_norm/Pow_output_0/blocks.10/self_attn/k_norm/Pow"Pow  (/blocks.10/self_attn/k_norm/Pow_output_0//blocks.10/self_attn/k_norm/ReduceMean_output_0&/blocks.10/self_attn/k_norm/ReduceMean" ReduceMean* axes@* keepdims //blocks.10/self_attn/k_norm/Constant_1_output_0&/blocks.10/self_attn/k_norm/Constant_1"Constant*H value*<B2/blocks.10/self_attn/k_norm/Constant_1_attr::valueJ75  //blocks.10/self_attn/k_norm/ReduceMean_output_0 //blocks.10/self_attn/k_norm/Constant_1_output_0(/blocks.10/self_attn/k_norm/Add_output_0/blocks.10/self_attn/k_norm/Add"Add } (/blocks.10/self_attn/k_norm/Add_output_0)/blocks.10/self_attn/k_norm/Sqrt_output_0 /blocks.10/self_attn/k_norm/Sqrt"Sqrt //blocks.10/self_attn/k_norm/Constant_2_output_0&/blocks.10/self_attn/k_norm/Constant_2"Constant*H value*<B2/blocks.10/self_attn/k_norm/Constant_2_attr::valueJ?  //blocks.10/self_attn/k_norm/Constant_2_output_0 )/blocks.10/self_attn/k_norm/Sqrt_output_0(/blocks.10/self_attn/k_norm/Div_output_0/blocks.10/self_attn/k_norm/Div"Div  )/blocks.10/self_attn/k_norm/Cast_output_0+/blocks.10/self_attn/k_norm/Cast_1_output_0"/blocks.10/self_attn/k_norm/Cast_1"Cast* to  +/blocks.10/self_attn/k_norm/Cast_1_output_0 (/blocks.10/self_attn/k_norm/Div_output_0(/blocks.10/self_attn/k_norm/Mul_output_0/blocks.10/self_attn/k_norm/Mul"Mul  (/blocks.10/self_attn/k_norm/Mul_output_0 !blocks.10.self_attn.k_norm.weight*/blocks.10/self_attn/k_norm/Mul_1_output_0!/blocks.10/self_attn/k_norm/Mul_1"Mul  */blocks.10/self_attn/k_norm/Mul_1_output_0+/blocks.10/self_attn/k_norm/Cast_2_output_0"/blocks.10/self_attn/k_norm/Cast_2"Cast* to  +/blocks.10/self_attn/q_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0!/blocks.10/self_attn/Mul_output_0/blocks.10/self_attn/Mul"Mul y +/blocks.10/self_attn/q_norm/Cast_2_output_0%/blocks.10/self_attn/Shape_2_output_0/blocks.10/self_attn/Shape_2"Shape (/blocks.10/self_attn/Constant_8_output_0/blocks.10/self_attn/Constant_8"Constant*E value*9B+/blocks.10/self_attn/Constant_8_attr::valueJ  %/blocks.10/self_attn/Shape_2_output_0 (/blocks.10/self_attn/Constant_8_output_0&/blocks.10/self_attn/Gather_2_output_0/blocks.10/self_attn/Gather_2"Gather* axis (/blocks.10/self_attn/Constant_9_output_0/blocks.10/self_attn/Constant_9"Constant*E value*9B+/blocks.10/self_attn/Constant_9_attr::valueJ  &/blocks.10/self_attn/Gather_2_output_0 (/blocks.10/self_attn/Constant_9_output_0!/blocks.10/self_attn/Div_output_0/blocks.10/self_attn/Div"Div s !/blocks.10/self_attn/Div_output_0"/blocks.10/self_attn/Cast_output_0/blocks.10/self_attn/Cast"Cast* to x "/blocks.10/self_attn/Cast_output_0$/blocks.10/self_attn/Cast_1_output_0/blocks.10/self_attn/Cast_1"Cast* to )/blocks.10/self_attn/Constant_10_output_0 /blocks.10/self_attn/Constant_10"Constant*H value*<B,/blocks.10/self_attn/Constant_10_attr::valueJ )/blocks.10/self_attn/Constant_11_output_0 /blocks.10/self_attn/Constant_11"Constant*H value*<B,/blocks.10/self_attn/Constant_11_attr::valueJ )/blocks.10/self_attn/Constant_12_output_0 /blocks.10/self_attn/Constant_12"Constant*H value*<B,/blocks.10/self_attn/Constant_12_attr::valueJ  $/blocks.10/self_attn/Cast_1_output_0 )/blocks.10/self_attn/Constant_12_output_0)/blocks.10/self_attn/Unsqueeze_6_output_0 /blocks.10/self_attn/Unsqueeze_6" Unsqueeze )/blocks.10/self_attn/Constant_13_output_0 /blocks.10/self_attn/Constant_13"Constant*H value*<B,/blocks.10/self_attn/Constant_13_attr::valueJ  +/blocks.10/self_attn/q_norm/Cast_2_output_0 )/blocks.10/self_attn/Constant_11_output_0 )/blocks.10/self_attn/Unsqueeze_6_output_0 )/blocks.10/self_attn/Constant_10_output_0 )/blocks.10/self_attn/Constant_13_output_0#/blocks.10/self_attn/Slice_output_0/blocks.10/self_attn/Slice"Slice )/blocks.10/self_attn/Constant_14_output_0 /blocks.10/self_attn/Constant_14"Constant*H value*<B,/blocks.10/self_attn/Constant_14_attr::valueJ )/blocks.10/self_attn/Constant_15_output_0 /blocks.10/self_attn/Constant_15"Constant*H value*<B,/blocks.10/self_attn/Constant_15_attr::valueJ  $/blocks.10/self_attn/Cast_1_output_0 )/blocks.10/self_attn/Constant_15_output_0)/blocks.10/self_attn/Unsqueeze_7_output_0 /blocks.10/self_attn/Unsqueeze_7" Unsqueeze )/blocks.10/self_attn/Constant_16_output_0 /blocks.10/self_attn/Constant_16"Constant*H value*<B,/blocks.10/self_attn/Constant_16_attr::valueJ )/blocks.10/self_attn/Constant_17_output_0 /blocks.10/self_attn/Constant_17"Constant*H value*<B,/blocks.10/self_attn/Constant_17_attr::valueJ  +/blocks.10/self_attn/q_norm/Cast_2_output_0 )/blocks.10/self_attn/Unsqueeze_7_output_0 )/blocks.10/self_attn/Constant_16_output_0 )/blocks.10/self_attn/Constant_14_output_0 )/blocks.10/self_attn/Constant_17_output_0%/blocks.10/self_attn/Slice_1_output_0/blocks.10/self_attn/Slice_1"Slice i %/blocks.10/self_attn/Slice_1_output_0!/blocks.10/self_attn/Neg_output_0/blocks.10/self_attn/Neg"Neg  !/blocks.10/self_attn/Neg_output_0 #/blocks.10/self_attn/Slice_output_0&/blocks.10/self_attn/Concat_3_output_0/blocks.10/self_attn/Concat_3"Concat* axis  &/blocks.10/self_attn/Concat_3_output_0 %/blocks.0/self_attn/Gather_3_output_0#/blocks.10/self_attn/Mul_1_output_0/blocks.10/self_attn/Mul_1"Mul  !/blocks.10/self_attn/Mul_output_0 #/blocks.10/self_attn/Mul_1_output_0!/blocks.10/self_attn/Add_output_0/blocks.10/self_attn/Add"Add  +/blocks.10/self_attn/k_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0#/blocks.10/self_attn/Mul_2_output_0/blocks.10/self_attn/Mul_2"Mul y +/blocks.10/self_attn/k_norm/Cast_2_output_0%/blocks.10/self_attn/Shape_3_output_0/blocks.10/self_attn/Shape_3"Shape )/blocks.10/self_attn/Constant_18_output_0 /blocks.10/self_attn/Constant_18"Constant*F value*:B,/blocks.10/self_attn/Constant_18_attr::valueJ  %/blocks.10/self_attn/Shape_3_output_0 )/blocks.10/self_attn/Constant_18_output_0&/blocks.10/self_attn/Gather_3_output_0/blocks.10/self_attn/Gather_3"Gather* axis )/blocks.10/self_attn/Constant_19_output_0 /blocks.10/self_attn/Constant_19"Constant*F value*:B,/blocks.10/self_attn/Constant_19_attr::valueJ  &/blocks.10/self_attn/Gather_3_output_0 )/blocks.10/self_attn/Constant_19_output_0#/blocks.10/self_attn/Div_1_output_0/blocks.10/self_attn/Div_1"Div y #/blocks.10/self_attn/Div_1_output_0$/blocks.10/self_attn/Cast_2_output_0/blocks.10/self_attn/Cast_2"Cast* to z $/blocks.10/self_attn/Cast_2_output_0$/blocks.10/self_attn/Cast_3_output_0/blocks.10/self_attn/Cast_3"Cast* to )/blocks.10/self_attn/Constant_20_output_0 /blocks.10/self_attn/Constant_20"Constant*H value*<B,/blocks.10/self_attn/Constant_20_attr::valueJ )/blocks.10/self_attn/Constant_21_output_0 /blocks.10/self_attn/Constant_21"Constant*H value*<B,/blocks.10/self_attn/Constant_21_attr::valueJ )/blocks.10/self_attn/Constant_22_output_0 /blocks.10/self_attn/Constant_22"Constant*H value*<B,/blocks.10/self_attn/Constant_22_attr::valueJ  $/blocks.10/self_attn/Cast_3_output_0 )/blocks.10/self_attn/Constant_22_output_0)/blocks.10/self_attn/Unsqueeze_8_output_0 /blocks.10/self_attn/Unsqueeze_8" Unsqueeze )/blocks.10/self_attn/Constant_23_output_0 /blocks.10/self_attn/Constant_23"Constant*H value*<B,/blocks.10/self_attn/Constant_23_attr::valueJ  +/blocks.10/self_attn/k_norm/Cast_2_output_0 )/blocks.10/self_attn/Constant_21_output_0 )/blocks.10/self_attn/Unsqueeze_8_output_0 )/blocks.10/self_attn/Constant_20_output_0 )/blocks.10/self_attn/Constant_23_output_0%/blocks.10/self_attn/Slice_2_output_0/blocks.10/self_attn/Slice_2"Slice )/blocks.10/self_attn/Constant_24_output_0 /blocks.10/self_attn/Constant_24"Constant*H value*<B,/blocks.10/self_attn/Constant_24_attr::valueJ )/blocks.10/self_attn/Constant_25_output_0 /blocks.10/self_attn/Constant_25"Constant*H value*<B,/blocks.10/self_attn/Constant_25_attr::valueJ  $/blocks.10/self_attn/Cast_3_output_0 )/blocks.10/self_attn/Constant_25_output_0)/blocks.10/self_attn/Unsqueeze_9_output_0 /blocks.10/self_attn/Unsqueeze_9" Unsqueeze )/blocks.10/self_attn/Constant_26_output_0 /blocks.10/self_attn/Constant_26"Constant*H value*<B,/blocks.10/self_attn/Constant_26_attr::valueJ )/blocks.10/self_attn/Constant_27_output_0 /blocks.10/self_attn/Constant_27"Constant*H value*<B,/blocks.10/self_attn/Constant_27_attr::valueJ  +/blocks.10/self_attn/k_norm/Cast_2_output_0 )/blocks.10/self_attn/Unsqueeze_9_output_0 )/blocks.10/self_attn/Constant_26_output_0 )/blocks.10/self_attn/Constant_24_output_0 )/blocks.10/self_attn/Constant_27_output_0%/blocks.10/self_attn/Slice_3_output_0/blocks.10/self_attn/Slice_3"Slice m %/blocks.10/self_attn/Slice_3_output_0#/blocks.10/self_attn/Neg_1_output_0/blocks.10/self_attn/Neg_1"Neg  #/blocks.10/self_attn/Neg_1_output_0 %/blocks.10/self_attn/Slice_2_output_0&/blocks.10/self_attn/Concat_4_output_0/blocks.10/self_attn/Concat_4"Concat* axis  &/blocks.10/self_attn/Concat_4_output_0 %/blocks.0/self_attn/Gather_3_output_0#/blocks.10/self_attn/Mul_3_output_0/blocks.10/self_attn/Mul_3"Mul  #/blocks.10/self_attn/Mul_2_output_0 #/blocks.10/self_attn/Mul_3_output_0#/blocks.10/self_attn/Add_1_output_0/blocks.10/self_attn/Add_1"Add  /Gather_10_output_0 /rotary/Constant_3_output_0&/blocks.10/self_attn/Gather_4_output_0/blocks.10/self_attn/Gather_4"Gather* axis  /Gather_10_output_0 /rotary/Constant_8_output_0&/blocks.10/self_attn/Gather_5_output_0/blocks.10/self_attn/Gather_5"Gather* axis  &/blocks.10/self_attn/Gather_4_output_0 #/blocks.10/self_attn/Add_1_output_0&/blocks.10/self_attn/Concat_5_output_0/blocks.10/self_attn/Concat_5"Concat* axis  &/blocks.10/self_attn/Gather_5_output_0 '/blocks.10/self_attn/Reshape_2_output_0&/blocks.10/self_attn/Concat_6_output_0/blocks.10/self_attn/Concat_6"Concat* axis )/blocks.10/self_attn/Constant_28_output_0 /blocks.10/self_attn/Constant_28"Constant*H value*<B,/blocks.10/self_attn/Constant_28_attr::valueJ  &/blocks.10/self_attn/Concat_5_output_0 )/blocks.10/self_attn/Constant_28_output_0*/blocks.10/self_attn/Unsqueeze_10_output_0!/blocks.10/self_attn/Unsqueeze_10" Unsqueeze )/blocks.10/self_attn/Constant_29_output_0 /blocks.10/self_attn/Constant_29"Constant*H value*<B,/blocks.10/self_attn/Constant_29_attr::valueJ  &/blocks.10/self_attn/Concat_6_output_0 )/blocks.10/self_attn/Constant_29_output_0*/blocks.10/self_attn/Unsqueeze_11_output_0!/blocks.10/self_attn/Unsqueeze_11" Unsqueeze  */blocks.10/self_attn/Unsqueeze_10_output_0 */blocks.10/self_attn/Unsqueeze_11_output_0&/blocks.10/self_attn/Concat_7_output_0/blocks.10/self_attn/Concat_7"Concat* axis  !/blocks.10/self_attn/Add_output_0'/blocks.10/self_attn/Transpose_output_0/blocks.10/self_attn/Transpose" Transpose* perm@@@@  &/blocks.10/self_attn/Concat_5_output_0)/blocks.10/self_attn/Transpose_1_output_0 /blocks.10/self_attn/Transpose_1" Transpose* perm@@@@  &/blocks.10/self_attn/Concat_6_output_0)/blocks.10/self_attn/Transpose_2_output_0 /blocks.10/self_attn/Transpose_2" Transpose* perm@@@@ w )/blocks.10/self_attn/Transpose_1_output_0%/blocks.10/self_attn/Shape_4_output_0/blocks.10/self_attn/Shape_4"Shape )/blocks.10/self_attn/Constant_30_output_0 /blocks.10/self_attn/Constant_30"Constant*F value*:B,/blocks.10/self_attn/Constant_30_attr::valueJ  %/blocks.10/self_attn/Shape_4_output_0 )/blocks.10/self_attn/Constant_30_output_0&/blocks.10/self_attn/Gather_6_output_0/blocks.10/self_attn/Gather_6"Gather* axis w )/blocks.10/self_attn/Transpose_1_output_0%/blocks.10/self_attn/Shape_5_output_0/blocks.10/self_attn/Shape_5"Shape )/blocks.10/self_attn/Constant_31_output_0 /blocks.10/self_attn/Constant_31"Constant*F value*:B,/blocks.10/self_attn/Constant_31_attr::valueJ  %/blocks.10/self_attn/Shape_5_output_0 )/blocks.10/self_attn/Constant_31_output_0&/blocks.10/self_attn/Gather_7_output_0/blocks.10/self_attn/Gather_7"Gather* axis w )/blocks.10/self_attn/Transpose_1_output_0%/blocks.10/self_attn/Shape_6_output_0/blocks.10/self_attn/Shape_6"Shape )/blocks.10/self_attn/Constant_32_output_0 /blocks.10/self_attn/Constant_32"Constant*F value*:B,/blocks.10/self_attn/Constant_32_attr::valueJ  %/blocks.10/self_attn/Shape_6_output_0 )/blocks.10/self_attn/Constant_32_output_0&/blocks.10/self_attn/Gather_8_output_0/blocks.10/self_attn/Gather_8"Gather* axis w )/blocks.10/self_attn/Transpose_1_output_0%/blocks.10/self_attn/Shape_7_output_0/blocks.10/self_attn/Shape_7"Shape )/blocks.10/self_attn/Constant_33_output_0 /blocks.10/self_attn/Constant_33"Constant*F value*:B,/blocks.10/self_attn/Constant_33_attr::valueJ  %/blocks.10/self_attn/Shape_7_output_0 )/blocks.10/self_attn/Constant_33_output_0&/blocks.10/self_attn/Gather_9_output_0/blocks.10/self_attn/Gather_9"Gather* axis )/blocks.10/self_attn/Constant_34_output_0 /blocks.10/self_attn/Constant_34"Constant*H value*<B,/blocks.10/self_attn/Constant_34_attr::valueJ  )/blocks.10/self_attn/Transpose_1_output_0 )/blocks.10/self_attn/Constant_34_output_0*/blocks.10/self_attn/Unsqueeze_12_output_0!/blocks.10/self_attn/Unsqueeze_12" Unsqueeze )/blocks.10/self_attn/Constant_35_output_0 /blocks.10/self_attn/Constant_35"Constant*H value*<B,/blocks.10/self_attn/Constant_35_attr::valueJ  &/blocks.10/self_attn/Gather_6_output_0 )/blocks.10/self_attn/Constant_35_output_0*/blocks.10/self_attn/Unsqueeze_13_output_0!/blocks.10/self_attn/Unsqueeze_13" Unsqueeze )/blocks.10/self_attn/Constant_36_output_0 /blocks.10/self_attn/Constant_36"Constant*H value*<B,/blocks.10/self_attn/Constant_36_attr::valueJ  &/blocks.10/self_attn/Gather_7_output_0 )/blocks.10/self_attn/Constant_36_output_0*/blocks.10/self_attn/Unsqueeze_14_output_0!/blocks.10/self_attn/Unsqueeze_14" Unsqueeze )/blocks.10/self_attn/Constant_37_output_0 /blocks.10/self_attn/Constant_37"Constant*H value*<B,/blocks.10/self_attn/Constant_37_attr::valueJ )/blocks.10/self_attn/Constant_38_output_0 /blocks.10/self_attn/Constant_38"Constant*H value*<B,/blocks.10/self_attn/Constant_38_attr::valueJ  &/blocks.10/self_attn/Gather_8_output_0 )/blocks.10/self_attn/Constant_38_output_0*/blocks.10/self_attn/Unsqueeze_15_output_0!/blocks.10/self_attn/Unsqueeze_15" Unsqueeze )/blocks.10/self_attn/Constant_39_output_0 /blocks.10/self_attn/Constant_39"Constant*H value*<B,/blocks.10/self_attn/Constant_39_attr::valueJ  &/blocks.10/self_attn/Gather_9_output_0 )/blocks.10/self_attn/Constant_39_output_0*/blocks.10/self_attn/Unsqueeze_16_output_0!/blocks.10/self_attn/Unsqueeze_16" Unsqueeze  */blocks.10/self_attn/Unsqueeze_13_output_0 */blocks.10/self_attn/Unsqueeze_14_output_0 )/blocks.10/self_attn/Constant_37_output_0 */blocks.10/self_attn/Unsqueeze_15_output_0 */blocks.10/self_attn/Unsqueeze_16_output_0&/blocks.10/self_attn/Concat_8_output_0/blocks.10/self_attn/Concat_8"Concat* axis )/blocks.10/self_attn/Constant_40_output_0 /blocks.10/self_attn/Constant_40"Constant*H value*<B,/blocks.10/self_attn/Constant_40_attr::valueJ  &/blocks.10/self_attn/Concat_8_output_0 )/blocks.10/self_attn/Constant_40_output_0'/blocks.10/self_attn/Reshape_3_output_0/blocks.10/self_attn/Reshape_3"Reshape* allowzero u '/blocks.10/self_attn/Reshape_3_output_0%/blocks.10/self_attn/Shape_8_output_0/blocks.10/self_attn/Shape_8"Shape  %/blocks.10/self_attn/Shape_8_output_0-/blocks.10/self_attn/ConstantOfShape_output_0$/blocks.10/self_attn/ConstantOfShape"ConstantOfShape*L value*@B0/blocks.10/self_attn/ConstantOfShape_attr::valueJ )/blocks.10/self_attn/Constant_41_output_0 /blocks.10/self_attn/Constant_41"Constant*F value*:B,/blocks.10/self_attn/Constant_41_attr::valueJ  -/blocks.10/self_attn/ConstantOfShape_output_0 )/blocks.10/self_attn/Constant_41_output_0#/blocks.10/self_attn/Mul_4_output_0/blocks.10/self_attn/Mul_4"Mul  '/blocks.10/self_attn/Reshape_3_output_0 #/blocks.10/self_attn/Mul_4_output_0#/blocks.10/self_attn/Equal_output_0/blocks.10/self_attn/Equal"Equal  #/blocks.10/self_attn/Equal_output_0 -/blocks.10/self_attn/ConstantOfShape_output_0 '/blocks.10/self_attn/Reshape_3_output_0#/blocks.10/self_attn/Where_output_0/blocks.10/self_attn/Where"Where  */blocks.10/self_attn/Unsqueeze_12_output_0 #/blocks.10/self_attn/Where_output_0$/blocks.10/self_attn/Expand_output_0/blocks.10/self_attn/Expand"Expand )/blocks.10/self_attn/Constant_42_output_0 /blocks.10/self_attn/Constant_42"Constant*F value*:B,/blocks.10/self_attn/Constant_42_attr::valueJ  &/blocks.10/self_attn/Gather_7_output_0 )/blocks.10/self_attn/Constant_42_output_0#/blocks.10/self_attn/Mul_5_output_0/blocks.10/self_attn/Mul_5"Mul fonnx::Unsqueeze_3442 Constant_5325"Constant*5 value*)BConstant_5325_attr::valueJ  &/blocks.10/self_attn/Gather_6_output_0 onnx::Unsqueeze_3442*/blocks.10/self_attn/Unsqueeze_17_output_0!/blocks.10/self_attn/Unsqueeze_17" Unsqueeze fonnx::Unsqueeze_3444 Constant_5327"Constant*5 value*)BConstant_5327_attr::valueJ  #/blocks.10/self_attn/Mul_5_output_0 onnx::Unsqueeze_3444*/blocks.10/self_attn/Unsqueeze_18_output_0!/blocks.10/self_attn/Unsqueeze_18" Unsqueeze fonnx::Unsqueeze_3446 Constant_5329"Constant*5 value*)BConstant_5329_attr::valueJ  &/blocks.10/self_attn/Gather_8_output_0 onnx::Unsqueeze_3446*/blocks.10/self_attn/Unsqueeze_19_output_0!/blocks.10/self_attn/Unsqueeze_19" Unsqueeze fonnx::Unsqueeze_3448 Constant_5331"Constant*5 value*)BConstant_5331_attr::valueJ  &/blocks.10/self_attn/Gather_9_output_0 onnx::Unsqueeze_3448*/blocks.10/self_attn/Unsqueeze_20_output_0!/blocks.10/self_attn/Unsqueeze_20" Unsqueeze  */blocks.10/self_attn/Unsqueeze_17_output_0 */blocks.10/self_attn/Unsqueeze_18_output_0 */blocks.10/self_attn/Unsqueeze_19_output_0 */blocks.10/self_attn/Unsqueeze_20_output_0&/blocks.10/self_attn/Concat_9_output_0/blocks.10/self_attn/Concat_9"Concat* axis  $/blocks.10/self_attn/Expand_output_0 &/blocks.10/self_attn/Concat_9_output_0'/blocks.10/self_attn/Reshape_4_output_0/blocks.10/self_attn/Reshape_4"Reshape* allowzero w )/blocks.10/self_attn/Transpose_2_output_0%/blocks.10/self_attn/Shape_9_output_0/blocks.10/self_attn/Shape_9"Shape )/blocks.10/self_attn/Constant_43_output_0 /blocks.10/self_attn/Constant_43"Constant*F value*:B,/blocks.10/self_attn/Constant_43_attr::valueJ  %/blocks.10/self_attn/Shape_9_output_0 )/blocks.10/self_attn/Constant_43_output_0'/blocks.10/self_attn/Gather_10_output_0/blocks.10/self_attn/Gather_10"Gather* axis y )/blocks.10/self_attn/Transpose_2_output_0&/blocks.10/self_attn/Shape_10_output_0/blocks.10/self_attn/Shape_10"Shape )/blocks.10/self_attn/Constant_44_output_0 /blocks.10/self_attn/Constant_44"Constant*F value*:B,/blocks.10/self_attn/Constant_44_attr::valueJ  &/blocks.10/self_attn/Shape_10_output_0 )/blocks.10/self_attn/Constant_44_output_0'/blocks.10/self_attn/Gather_11_output_0/blocks.10/self_attn/Gather_11"Gather* axis y )/blocks.10/self_attn/Transpose_2_output_0&/blocks.10/self_attn/Shape_11_output_0/blocks.10/self_attn/Shape_11"Shape )/blocks.10/self_attn/Constant_45_output_0 /blocks.10/self_attn/Constant_45"Constant*F value*:B,/blocks.10/self_attn/Constant_45_attr::valueJ  &/blocks.10/self_attn/Shape_11_output_0 )/blocks.10/self_attn/Constant_45_output_0'/blocks.10/self_attn/Gather_12_output_0/blocks.10/self_attn/Gather_12"Gather* axis y )/blocks.10/self_attn/Transpose_2_output_0&/blocks.10/self_attn/Shape_12_output_0/blocks.10/self_attn/Shape_12"Shape )/blocks.10/self_attn/Constant_46_output_0 /blocks.10/self_attn/Constant_46"Constant*F value*:B,/blocks.10/self_attn/Constant_46_attr::valueJ  &/blocks.10/self_attn/Shape_12_output_0 )/blocks.10/self_attn/Constant_46_output_0'/blocks.10/self_attn/Gather_13_output_0/blocks.10/self_attn/Gather_13"Gather* axis )/blocks.10/self_attn/Constant_47_output_0 /blocks.10/self_attn/Constant_47"Constant*H value*<B,/blocks.10/self_attn/Constant_47_attr::valueJ  )/blocks.10/self_attn/Transpose_2_output_0 )/blocks.10/self_attn/Constant_47_output_0*/blocks.10/self_attn/Unsqueeze_21_output_0!/blocks.10/self_attn/Unsqueeze_21" Unsqueeze )/blocks.10/self_attn/Constant_48_output_0 /blocks.10/self_attn/Constant_48"Constant*H value*<B,/blocks.10/self_attn/Constant_48_attr::valueJ  '/blocks.10/self_attn/Gather_10_output_0 )/blocks.10/self_attn/Constant_48_output_0*/blocks.10/self_attn/Unsqueeze_22_output_0!/blocks.10/self_attn/Unsqueeze_22" Unsqueeze )/blocks.10/self_attn/Constant_49_output_0 /blocks.10/self_attn/Constant_49"Constant*H value*<B,/blocks.10/self_attn/Constant_49_attr::valueJ  '/blocks.10/self_attn/Gather_11_output_0 )/blocks.10/self_attn/Constant_49_output_0*/blocks.10/self_attn/Unsqueeze_23_output_0!/blocks.10/self_attn/Unsqueeze_23" Unsqueeze )/blocks.10/self_attn/Constant_50_output_0 /blocks.10/self_attn/Constant_50"Constant*H value*<B,/blocks.10/self_attn/Constant_50_attr::valueJ )/blocks.10/self_attn/Constant_51_output_0 /blocks.10/self_attn/Constant_51"Constant*H value*<B,/blocks.10/self_attn/Constant_51_attr::valueJ  '/blocks.10/self_attn/Gather_12_output_0 )/blocks.10/self_attn/Constant_51_output_0*/blocks.10/self_attn/Unsqueeze_24_output_0!/blocks.10/self_attn/Unsqueeze_24" Unsqueeze )/blocks.10/self_attn/Constant_52_output_0 /blocks.10/self_attn/Constant_52"Constant*H value*<B,/blocks.10/self_attn/Constant_52_attr::valueJ  '/blocks.10/self_attn/Gather_13_output_0 )/blocks.10/self_attn/Constant_52_output_0*/blocks.10/self_attn/Unsqueeze_25_output_0!/blocks.10/self_attn/Unsqueeze_25" Unsqueeze  */blocks.10/self_attn/Unsqueeze_22_output_0 */blocks.10/self_attn/Unsqueeze_23_output_0 )/blocks.10/self_attn/Constant_50_output_0 */blocks.10/self_attn/Unsqueeze_24_output_0 */blocks.10/self_attn/Unsqueeze_25_output_0'/blocks.10/self_attn/Concat_10_output_0/blocks.10/self_attn/Concat_10"Concat* axis )/blocks.10/self_attn/Constant_53_output_0 /blocks.10/self_attn/Constant_53"Constant*H value*<B,/blocks.10/self_attn/Constant_53_attr::valueJ  '/blocks.10/self_attn/Concat_10_output_0 )/blocks.10/self_attn/Constant_53_output_0'/blocks.10/self_attn/Reshape_5_output_0/blocks.10/self_attn/Reshape_5"Reshape* allowzero w '/blocks.10/self_attn/Reshape_5_output_0&/blocks.10/self_attn/Shape_13_output_0/blocks.10/self_attn/Shape_13"Shape  &/blocks.10/self_attn/Shape_13_output_0//blocks.10/self_attn/ConstantOfShape_1_output_0&/blocks.10/self_attn/ConstantOfShape_1"ConstantOfShape*N value*BB2/blocks.10/self_attn/ConstantOfShape_1_attr::valueJ )/blocks.10/self_attn/Constant_54_output_0 /blocks.10/self_attn/Constant_54"Constant*F value*:B,/blocks.10/self_attn/Constant_54_attr::valueJ  //blocks.10/self_attn/ConstantOfShape_1_output_0 )/blocks.10/self_attn/Constant_54_output_0#/blocks.10/self_attn/Mul_6_output_0/blocks.10/self_attn/Mul_6"Mul  '/blocks.10/self_attn/Reshape_5_output_0 #/blocks.10/self_attn/Mul_6_output_0%/blocks.10/self_attn/Equal_1_output_0/blocks.10/self_attn/Equal_1"Equal  %/blocks.10/self_attn/Equal_1_output_0 //blocks.10/self_attn/ConstantOfShape_1_output_0 '/blocks.10/self_attn/Reshape_5_output_0%/blocks.10/self_attn/Where_1_output_0/blocks.10/self_attn/Where_1"Where  */blocks.10/self_attn/Unsqueeze_21_output_0 %/blocks.10/self_attn/Where_1_output_0&/blocks.10/self_attn/Expand_1_output_0/blocks.10/self_attn/Expand_1"Expand )/blocks.10/self_attn/Constant_55_output_0 /blocks.10/self_attn/Constant_55"Constant*F value*:B,/blocks.10/self_attn/Constant_55_attr::valueJ  '/blocks.10/self_attn/Gather_11_output_0 )/blocks.10/self_attn/Constant_55_output_0#/blocks.10/self_attn/Mul_7_output_0/blocks.10/self_attn/Mul_7"Mul fonnx::Unsqueeze_3488 Constant_5370"Constant*5 value*)BConstant_5370_attr::valueJ  '/blocks.10/self_attn/Gather_10_output_0 onnx::Unsqueeze_3488*/blocks.10/self_attn/Unsqueeze_26_output_0!/blocks.10/self_attn/Unsqueeze_26" Unsqueeze fonnx::Unsqueeze_3490 Constant_5372"Constant*5 value*)BConstant_5372_attr::valueJ  #/blocks.10/self_attn/Mul_7_output_0 onnx::Unsqueeze_3490*/blocks.10/self_attn/Unsqueeze_27_output_0!/blocks.10/self_attn/Unsqueeze_27" Unsqueeze fonnx::Unsqueeze_3492 Constant_5374"Constant*5 value*)BConstant_5374_attr::valueJ  '/blocks.10/self_attn/Gather_12_output_0 onnx::Unsqueeze_3492*/blocks.10/self_attn/Unsqueeze_28_output_0!/blocks.10/self_attn/Unsqueeze_28" Unsqueeze fonnx::Unsqueeze_3494 Constant_5376"Constant*5 value*)BConstant_5376_attr::valueJ  '/blocks.10/self_attn/Gather_13_output_0 onnx::Unsqueeze_3494*/blocks.10/self_attn/Unsqueeze_29_output_0!/blocks.10/self_attn/Unsqueeze_29" Unsqueeze  */blocks.10/self_attn/Unsqueeze_26_output_0 */blocks.10/self_attn/Unsqueeze_27_output_0 */blocks.10/self_attn/Unsqueeze_28_output_0 */blocks.10/self_attn/Unsqueeze_29_output_0'/blocks.10/self_attn/Concat_11_output_0/blocks.10/self_attn/Concat_11"Concat* axis  &/blocks.10/self_attn/Expand_1_output_0 '/blocks.10/self_attn/Concat_11_output_0'/blocks.10/self_attn/Reshape_6_output_0/blocks.10/self_attn/Reshape_6"Reshape* allowzero  '/blocks.10/self_attn/Transpose_output_0 '/blocks.10/self_attn/Reshape_4_output_0$/blocks.10/self_attn/MatMul_output_0/blocks.10/self_attn/MatMul"MatMul )/blocks.10/self_attn/Constant_56_output_0 /blocks.10/self_attn/Constant_56"Constant*B value*6B,/blocks.10/self_attn/Constant_56_attr::valueJ5A  $/blocks.10/self_attn/MatMul_output_0 )/blocks.10/self_attn/Constant_56_output_0#/blocks.10/self_attn/Div_2_output_0/blocks.10/self_attn/Div_2"Div { #/blocks.10/self_attn/Div_2_output_0 attention_mask#/blocks.10/self_attn/Add_2_output_0/blocks.10/self_attn/Add_2"Add  #/blocks.10/self_attn/Add_2_output_0%/blocks.10/self_attn/Softmax_output_0/blocks.10/self_attn/Softmax"Softmax* axis { %/blocks.10/self_attn/Softmax_output_0$/blocks.10/self_attn/Cast_4_output_0/blocks.10/self_attn/Cast_4"Cast* to  $/blocks.10/self_attn/Cast_4_output_0 '/blocks.10/self_attn/Reshape_6_output_0&/blocks.10/self_attn/MatMul_1_output_0/blocks.10/self_attn/MatMul_1"MatMul  &/blocks.10/self_attn/MatMul_1_output_0)/blocks.10/self_attn/Transpose_3_output_0 /blocks.10/self_attn/Transpose_3" Transpose* perm@@@@ fonnx::Unsqueeze_3506 Constant_5388"Constant*5 value*)BConstant_5388_attr::valueJ  $/blocks.10/self_attn/Gather_output_0 onnx::Unsqueeze_3506*/blocks.10/self_attn/Unsqueeze_30_output_0!/blocks.10/self_attn/Unsqueeze_30" Unsqueeze fonnx::Unsqueeze_3508 Constant_5390"Constant*5 value*)BConstant_5390_attr::valueJ  &/blocks.10/self_attn/Gather_1_output_0 onnx::Unsqueeze_3508*/blocks.10/self_attn/Unsqueeze_31_output_0!/blocks.10/self_attn/Unsqueeze_31" Unsqueeze )/blocks.10/self_attn/Constant_57_output_0 /blocks.10/self_attn/Constant_57"Constant*H value*<B,/blocks.10/self_attn/Constant_57_attr::valueJ  */blocks.10/self_attn/Unsqueeze_30_output_0 */blocks.10/self_attn/Unsqueeze_31_output_0 )/blocks.10/self_attn/Constant_57_output_0'/blocks.10/self_attn/Concat_12_output_0/blocks.10/self_attn/Concat_12"Concat* axis  )/blocks.10/self_attn/Transpose_3_output_0 '/blocks.10/self_attn/Concat_12_output_0'/blocks.10/self_attn/Reshape_7_output_0/blocks.10/self_attn/Reshape_7"Reshape* allowzero  '/blocks.10/self_attn/Reshape_7_output_0 onnx::MatMul_8869+/blocks.10/self_attn/o_proj/MatMul_output_0"/blocks.10/self_attn/o_proj/MatMul"MatMul  */blocks.10/input_layernorm/Cast_1_output_0 +/blocks.10/self_attn/o_proj/MatMul_output_0/blocks.10/Add_output_0/blocks.10/Add"Add  /blocks.10/Add_output_01/blocks.10/post_attention_layernorm/Cast_output_0(/blocks.10/post_attention_layernorm/Cast"Cast* to 5/blocks.10/post_attention_layernorm/Constant_output_0,/blocks.10/post_attention_layernorm/Constant"Constant*N value*BB8/blocks.10/post_attention_layernorm/Constant_attr::valueJ@  1/blocks.10/post_attention_layernorm/Cast_output_0 5/blocks.10/post_attention_layernorm/Constant_output_00/blocks.10/post_attention_layernorm/Pow_output_0'/blocks.10/post_attention_layernorm/Pow"Pow  0/blocks.10/post_attention_layernorm/Pow_output_07/blocks.10/post_attention_layernorm/ReduceMean_output_0./blocks.10/post_attention_layernorm/ReduceMean" ReduceMean* axes@* keepdims 7/blocks.10/post_attention_layernorm/Constant_1_output_0./blocks.10/post_attention_layernorm/Constant_1"Constant*P value*DB:/blocks.10/post_attention_layernorm/Constant_1_attr::valueJ75  7/blocks.10/post_attention_layernorm/ReduceMean_output_0 7/blocks.10/post_attention_layernorm/Constant_1_output_00/blocks.10/post_attention_layernorm/Add_output_0'/blocks.10/post_attention_layernorm/Add"Add  0/blocks.10/post_attention_layernorm/Add_output_01/blocks.10/post_attention_layernorm/Sqrt_output_0(/blocks.10/post_attention_layernorm/Sqrt"Sqrt 7/blocks.10/post_attention_layernorm/Constant_2_output_0./blocks.10/post_attention_layernorm/Constant_2"Constant*P value*DB:/blocks.10/post_attention_layernorm/Constant_2_attr::valueJ?  7/blocks.10/post_attention_layernorm/Constant_2_output_0 1/blocks.10/post_attention_layernorm/Sqrt_output_00/blocks.10/post_attention_layernorm/Div_output_0'/blocks.10/post_attention_layernorm/Div"Div  1/blocks.10/post_attention_layernorm/Cast_output_03/blocks.10/post_attention_layernorm/Cast_1_output_0*/blocks.10/post_attention_layernorm/Cast_1"Cast* to  3/blocks.10/post_attention_layernorm/Cast_1_output_0 0/blocks.10/post_attention_layernorm/Div_output_00/blocks.10/post_attention_layernorm/Mul_output_0'/blocks.10/post_attention_layernorm/Mul"Mul  0/blocks.10/post_attention_layernorm/Mul_output_0 )blocks.10.post_attention_layernorm.weight2/blocks.10/post_attention_layernorm/Mul_1_output_0)/blocks.10/post_attention_layernorm/Mul_1"Mul  2/blocks.10/post_attention_layernorm/Mul_1_output_03/blocks.10/post_attention_layernorm/Cast_2_output_0*/blocks.10/post_attention_layernorm/Cast_2"Cast* to  3/blocks.10/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_8870(/blocks.10/mlp/gate_proj/MatMul_output_0/blocks.10/mlp/gate_proj/MatMul"MatMul z (/blocks.10/mlp/gate_proj/MatMul_output_0&/blocks.10/mlp/act_fn/Sigmoid_output_0/blocks.10/mlp/act_fn/Sigmoid"Sigmoid  (/blocks.10/mlp/gate_proj/MatMul_output_0 &/blocks.10/mlp/act_fn/Sigmoid_output_0"/blocks.10/mlp/act_fn/Mul_output_0/blocks.10/mlp/act_fn/Mul"Mul  3/blocks.10/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_8871&/blocks.10/mlp/up_proj/MatMul_output_0/blocks.10/mlp/up_proj/MatMul"MatMul  "/blocks.10/mlp/act_fn/Mul_output_0 &/blocks.10/mlp/up_proj/MatMul_output_0/blocks.10/mlp/Mul_output_0/blocks.10/mlp/Mul"Mul  /blocks.10/mlp/Mul_output_0 onnx::MatMul_8872(/blocks.10/mlp/down_proj/MatMul_output_0/blocks.10/mlp/down_proj/MatMul"MatMul  3/blocks.10/post_attention_layernorm/Cast_1_output_0 (/blocks.10/mlp/down_proj/MatMul_output_0/blocks.10/Add_1_output_0/blocks.10/Add_1"Add `/Constant_4_output_0 /Constant_4"Constant*1 value*%B/Constant_4_attr::valueJ  ] past_key_values /Constant_4_output_0/Gather_11_output_0 /Gather_11"Gather* axis /blocks.11/Constant_output_0/blocks.11/Constant"Constant*K value*?B/blocks.11/Constant_attr::valueJ  /blocks.10/Add_1_output_0 /blocks.11/Constant_output_0/blocks.11/Reshape_output_0/blocks.11/Reshape"Reshape* allowzero y /blocks.11/Reshape_output_0(/blocks.11/input_layernorm/Cast_output_0/blocks.11/input_layernorm/Cast"Cast* to ,/blocks.11/input_layernorm/Constant_output_0#/blocks.11/input_layernorm/Constant"Constant*E value*9B//blocks.11/input_layernorm/Constant_attr::valueJ@  (/blocks.11/input_layernorm/Cast_output_0 ,/blocks.11/input_layernorm/Constant_output_0'/blocks.11/input_layernorm/Pow_output_0/blocks.11/input_layernorm/Pow"Pow  '/blocks.11/input_layernorm/Pow_output_0./blocks.11/input_layernorm/ReduceMean_output_0%/blocks.11/input_layernorm/ReduceMean" ReduceMean* axes@* keepdims ./blocks.11/input_layernorm/Constant_1_output_0%/blocks.11/input_layernorm/Constant_1"Constant*G value*;B1/blocks.11/input_layernorm/Constant_1_attr::valueJ75  ./blocks.11/input_layernorm/ReduceMean_output_0 ./blocks.11/input_layernorm/Constant_1_output_0'/blocks.11/input_layernorm/Add_output_0/blocks.11/input_layernorm/Add"Add z '/blocks.11/input_layernorm/Add_output_0(/blocks.11/input_layernorm/Sqrt_output_0/blocks.11/input_layernorm/Sqrt"Sqrt ./blocks.11/input_layernorm/Constant_2_output_0%/blocks.11/input_layernorm/Constant_2"Constant*G value*;B1/blocks.11/input_layernorm/Constant_2_attr::valueJ?  ./blocks.11/input_layernorm/Constant_2_output_0 (/blocks.11/input_layernorm/Sqrt_output_0'/blocks.11/input_layernorm/Div_output_0/blocks.11/input_layernorm/Div"Div  (/blocks.11/input_layernorm/Cast_output_0*/blocks.11/input_layernorm/Cast_1_output_0!/blocks.11/input_layernorm/Cast_1"Cast* to  */blocks.11/input_layernorm/Cast_1_output_0 '/blocks.11/input_layernorm/Div_output_0'/blocks.11/input_layernorm/Mul_output_0/blocks.11/input_layernorm/Mul"Mul  '/blocks.11/input_layernorm/Mul_output_0 blocks.11.input_layernorm.weight)/blocks.11/input_layernorm/Mul_1_output_0 /blocks.11/input_layernorm/Mul_1"Mul  )/blocks.11/input_layernorm/Mul_1_output_0*/blocks.11/input_layernorm/Cast_2_output_0!/blocks.11/input_layernorm/Cast_2"Cast* to t */blocks.11/input_layernorm/Cast_2_output_0#/blocks.11/self_attn/Shape_output_0/blocks.11/self_attn/Shape"Shape &/blocks.11/self_attn/Constant_output_0/blocks.11/self_attn/Constant"Constant*C value*7B)/blocks.11/self_attn/Constant_attr::valueJ  #/blocks.11/self_attn/Shape_output_0 &/blocks.11/self_attn/Constant_output_0$/blocks.11/self_attn/Gather_output_0/blocks.11/self_attn/Gather"Gather* axis x */blocks.11/input_layernorm/Cast_2_output_0%/blocks.11/self_attn/Shape_1_output_0/blocks.11/self_attn/Shape_1"Shape (/blocks.11/self_attn/Constant_1_output_0/blocks.11/self_attn/Constant_1"Constant*E value*9B+/blocks.11/self_attn/Constant_1_attr::valueJ  %/blocks.11/self_attn/Shape_1_output_0 (/blocks.11/self_attn/Constant_1_output_0&/blocks.11/self_attn/Gather_1_output_0/blocks.11/self_attn/Gather_1"Gather* axis  */blocks.11/input_layernorm/Cast_2_output_0 onnx::MatMul_8873+/blocks.11/self_attn/q_proj/MatMul_output_0"/blocks.11/self_attn/q_proj/MatMul"MatMul  */blocks.11/input_layernorm/Cast_2_output_0 onnx::MatMul_8874+/blocks.11/self_attn/k_proj/MatMul_output_0"/blocks.11/self_attn/k_proj/MatMul"MatMul  */blocks.11/input_layernorm/Cast_2_output_0 onnx::MatMul_8875+/blocks.11/self_attn/v_proj/MatMul_output_0"/blocks.11/self_attn/v_proj/MatMul"MatMul fonnx::Unsqueeze_3569 Constant_5443"Constant*5 value*)BConstant_5443_attr::valueJ  $/blocks.11/self_attn/Gather_output_0 onnx::Unsqueeze_3569'/blocks.11/self_attn/Unsqueeze_output_0/blocks.11/self_attn/Unsqueeze" Unsqueeze fonnx::Unsqueeze_3571 Constant_5445"Constant*5 value*)BConstant_5445_attr::valueJ  &/blocks.11/self_attn/Gather_1_output_0 onnx::Unsqueeze_3571)/blocks.11/self_attn/Unsqueeze_1_output_0 /blocks.11/self_attn/Unsqueeze_1" Unsqueeze (/blocks.11/self_attn/Constant_2_output_0/blocks.11/self_attn/Constant_2"Constant*G value*;B+/blocks.11/self_attn/Constant_2_attr::valueJ (/blocks.11/self_attn/Constant_3_output_0/blocks.11/self_attn/Constant_3"Constant*G value*;B+/blocks.11/self_attn/Constant_3_attr::valueJ  '/blocks.11/self_attn/Unsqueeze_output_0 )/blocks.11/self_attn/Unsqueeze_1_output_0 (/blocks.11/self_attn/Constant_2_output_0 (/blocks.11/self_attn/Constant_3_output_0$/blocks.11/self_attn/Concat_output_0/blocks.11/self_attn/Concat"Concat* axis  +/blocks.11/self_attn/q_proj/MatMul_output_0 $/blocks.11/self_attn/Concat_output_0%/blocks.11/self_attn/Reshape_output_0/blocks.11/self_attn/Reshape"Reshape* allowzero fonnx::Unsqueeze_3579 Constant_5451"Constant*5 value*)BConstant_5451_attr::valueJ  $/blocks.11/self_attn/Gather_output_0 onnx::Unsqueeze_3579)/blocks.11/self_attn/Unsqueeze_2_output_0 /blocks.11/self_attn/Unsqueeze_2" Unsqueeze fonnx::Unsqueeze_3581 Constant_5453"Constant*5 value*)BConstant_5453_attr::valueJ  &/blocks.11/self_attn/Gather_1_output_0 onnx::Unsqueeze_3581)/blocks.11/self_attn/Unsqueeze_3_output_0 /blocks.11/self_attn/Unsqueeze_3" Unsqueeze (/blocks.11/self_attn/Constant_4_output_0/blocks.11/self_attn/Constant_4"Constant*G value*;B+/blocks.11/self_attn/Constant_4_attr::valueJ (/blocks.11/self_attn/Constant_5_output_0/blocks.11/self_attn/Constant_5"Constant*G value*;B+/blocks.11/self_attn/Constant_5_attr::valueJ  )/blocks.11/self_attn/Unsqueeze_2_output_0 )/blocks.11/self_attn/Unsqueeze_3_output_0 (/blocks.11/self_attn/Constant_4_output_0 (/blocks.11/self_attn/Constant_5_output_0&/blocks.11/self_attn/Concat_1_output_0/blocks.11/self_attn/Concat_1"Concat* axis fonnx::Unsqueeze_3588 Constant_5458"Constant*5 value*)BConstant_5458_attr::valueJ  $/blocks.11/self_attn/Gather_output_0 onnx::Unsqueeze_3588)/blocks.11/self_attn/Unsqueeze_4_output_0 /blocks.11/self_attn/Unsqueeze_4" Unsqueeze fonnx::Unsqueeze_3590 Constant_5460"Constant*5 value*)BConstant_5460_attr::valueJ  &/blocks.11/self_attn/Gather_1_output_0 onnx::Unsqueeze_3590)/blocks.11/self_attn/Unsqueeze_5_output_0 /blocks.11/self_attn/Unsqueeze_5" Unsqueeze (/blocks.11/self_attn/Constant_6_output_0/blocks.11/self_attn/Constant_6"Constant*G value*;B+/blocks.11/self_attn/Constant_6_attr::valueJ (/blocks.11/self_attn/Constant_7_output_0/blocks.11/self_attn/Constant_7"Constant*G value*;B+/blocks.11/self_attn/Constant_7_attr::valueJ  )/blocks.11/self_attn/Unsqueeze_4_output_0 )/blocks.11/self_attn/Unsqueeze_5_output_0 (/blocks.11/self_attn/Constant_6_output_0 (/blocks.11/self_attn/Constant_7_output_0&/blocks.11/self_attn/Concat_2_output_0/blocks.11/self_attn/Concat_2"Concat* axis  +/blocks.11/self_attn/k_proj/MatMul_output_0 &/blocks.11/self_attn/Concat_1_output_0'/blocks.11/self_attn/Reshape_1_output_0/blocks.11/self_attn/Reshape_1"Reshape* allowzero  +/blocks.11/self_attn/v_proj/MatMul_output_0 &/blocks.11/self_attn/Concat_2_output_0'/blocks.11/self_attn/Reshape_2_output_0/blocks.11/self_attn/Reshape_2"Reshape* allowzero  %/blocks.11/self_attn/Reshape_output_0)/blocks.11/self_attn/q_norm/Cast_output_0 /blocks.11/self_attn/q_norm/Cast"Cast* to -/blocks.11/self_attn/q_norm/Constant_output_0$/blocks.11/self_attn/q_norm/Constant"Constant*F value*:B0/blocks.11/self_attn/q_norm/Constant_attr::valueJ@  )/blocks.11/self_attn/q_norm/Cast_output_0 -/blocks.11/self_attn/q_norm/Constant_output_0(/blocks.11/self_attn/q_norm/Pow_output_0/blocks.11/self_attn/q_norm/Pow"Pow  (/blocks.11/self_attn/q_norm/Pow_output_0//blocks.11/self_attn/q_norm/ReduceMean_output_0&/blocks.11/self_attn/q_norm/ReduceMean" ReduceMean* axes@* keepdims //blocks.11/self_attn/q_norm/Constant_1_output_0&/blocks.11/self_attn/q_norm/Constant_1"Constant*H value*<B2/blocks.11/self_attn/q_norm/Constant_1_attr::valueJ75  //blocks.11/self_attn/q_norm/ReduceMean_output_0 //blocks.11/self_attn/q_norm/Constant_1_output_0(/blocks.11/self_attn/q_norm/Add_output_0/blocks.11/self_attn/q_norm/Add"Add } (/blocks.11/self_attn/q_norm/Add_output_0)/blocks.11/self_attn/q_norm/Sqrt_output_0 /blocks.11/self_attn/q_norm/Sqrt"Sqrt //blocks.11/self_attn/q_norm/Constant_2_output_0&/blocks.11/self_attn/q_norm/Constant_2"Constant*H value*<B2/blocks.11/self_attn/q_norm/Constant_2_attr::valueJ?  //blocks.11/self_attn/q_norm/Constant_2_output_0 )/blocks.11/self_attn/q_norm/Sqrt_output_0(/blocks.11/self_attn/q_norm/Div_output_0/blocks.11/self_attn/q_norm/Div"Div  )/blocks.11/self_attn/q_norm/Cast_output_0+/blocks.11/self_attn/q_norm/Cast_1_output_0"/blocks.11/self_attn/q_norm/Cast_1"Cast* to  +/blocks.11/self_attn/q_norm/Cast_1_output_0 (/blocks.11/self_attn/q_norm/Div_output_0(/blocks.11/self_attn/q_norm/Mul_output_0/blocks.11/self_attn/q_norm/Mul"Mul  (/blocks.11/self_attn/q_norm/Mul_output_0 !blocks.11.self_attn.q_norm.weight*/blocks.11/self_attn/q_norm/Mul_1_output_0!/blocks.11/self_attn/q_norm/Mul_1"Mul  */blocks.11/self_attn/q_norm/Mul_1_output_0+/blocks.11/self_attn/q_norm/Cast_2_output_0"/blocks.11/self_attn/q_norm/Cast_2"Cast* to  '/blocks.11/self_attn/Reshape_1_output_0)/blocks.11/self_attn/k_norm/Cast_output_0 /blocks.11/self_attn/k_norm/Cast"Cast* to -/blocks.11/self_attn/k_norm/Constant_output_0$/blocks.11/self_attn/k_norm/Constant"Constant*F value*:B0/blocks.11/self_attn/k_norm/Constant_attr::valueJ@  )/blocks.11/self_attn/k_norm/Cast_output_0 -/blocks.11/self_attn/k_norm/Constant_output_0(/blocks.11/self_attn/k_norm/Pow_output_0/blocks.11/self_attn/k_norm/Pow"Pow  (/blocks.11/self_attn/k_norm/Pow_output_0//blocks.11/self_attn/k_norm/ReduceMean_output_0&/blocks.11/self_attn/k_norm/ReduceMean" ReduceMean* axes@* keepdims //blocks.11/self_attn/k_norm/Constant_1_output_0&/blocks.11/self_attn/k_norm/Constant_1"Constant*H value*<B2/blocks.11/self_attn/k_norm/Constant_1_attr::valueJ75  //blocks.11/self_attn/k_norm/ReduceMean_output_0 //blocks.11/self_attn/k_norm/Constant_1_output_0(/blocks.11/self_attn/k_norm/Add_output_0/blocks.11/self_attn/k_norm/Add"Add } (/blocks.11/self_attn/k_norm/Add_output_0)/blocks.11/self_attn/k_norm/Sqrt_output_0 /blocks.11/self_attn/k_norm/Sqrt"Sqrt //blocks.11/self_attn/k_norm/Constant_2_output_0&/blocks.11/self_attn/k_norm/Constant_2"Constant*H value*<B2/blocks.11/self_attn/k_norm/Constant_2_attr::valueJ?  //blocks.11/self_attn/k_norm/Constant_2_output_0 )/blocks.11/self_attn/k_norm/Sqrt_output_0(/blocks.11/self_attn/k_norm/Div_output_0/blocks.11/self_attn/k_norm/Div"Div  )/blocks.11/self_attn/k_norm/Cast_output_0+/blocks.11/self_attn/k_norm/Cast_1_output_0"/blocks.11/self_attn/k_norm/Cast_1"Cast* to  +/blocks.11/self_attn/k_norm/Cast_1_output_0 (/blocks.11/self_attn/k_norm/Div_output_0(/blocks.11/self_attn/k_norm/Mul_output_0/blocks.11/self_attn/k_norm/Mul"Mul  (/blocks.11/self_attn/k_norm/Mul_output_0 !blocks.11.self_attn.k_norm.weight*/blocks.11/self_attn/k_norm/Mul_1_output_0!/blocks.11/self_attn/k_norm/Mul_1"Mul  */blocks.11/self_attn/k_norm/Mul_1_output_0+/blocks.11/self_attn/k_norm/Cast_2_output_0"/blocks.11/self_attn/k_norm/Cast_2"Cast* to  +/blocks.11/self_attn/q_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0!/blocks.11/self_attn/Mul_output_0/blocks.11/self_attn/Mul"Mul y +/blocks.11/self_attn/q_norm/Cast_2_output_0%/blocks.11/self_attn/Shape_2_output_0/blocks.11/self_attn/Shape_2"Shape (/blocks.11/self_attn/Constant_8_output_0/blocks.11/self_attn/Constant_8"Constant*E value*9B+/blocks.11/self_attn/Constant_8_attr::valueJ  %/blocks.11/self_attn/Shape_2_output_0 (/blocks.11/self_attn/Constant_8_output_0&/blocks.11/self_attn/Gather_2_output_0/blocks.11/self_attn/Gather_2"Gather* axis (/blocks.11/self_attn/Constant_9_output_0/blocks.11/self_attn/Constant_9"Constant*E value*9B+/blocks.11/self_attn/Constant_9_attr::valueJ  &/blocks.11/self_attn/Gather_2_output_0 (/blocks.11/self_attn/Constant_9_output_0!/blocks.11/self_attn/Div_output_0/blocks.11/self_attn/Div"Div s !/blocks.11/self_attn/Div_output_0"/blocks.11/self_attn/Cast_output_0/blocks.11/self_attn/Cast"Cast* to x "/blocks.11/self_attn/Cast_output_0$/blocks.11/self_attn/Cast_1_output_0/blocks.11/self_attn/Cast_1"Cast* to )/blocks.11/self_attn/Constant_10_output_0 /blocks.11/self_attn/Constant_10"Constant*H value*<B,/blocks.11/self_attn/Constant_10_attr::valueJ )/blocks.11/self_attn/Constant_11_output_0 /blocks.11/self_attn/Constant_11"Constant*H value*<B,/blocks.11/self_attn/Constant_11_attr::valueJ )/blocks.11/self_attn/Constant_12_output_0 /blocks.11/self_attn/Constant_12"Constant*H value*<B,/blocks.11/self_attn/Constant_12_attr::valueJ  $/blocks.11/self_attn/Cast_1_output_0 )/blocks.11/self_attn/Constant_12_output_0)/blocks.11/self_attn/Unsqueeze_6_output_0 /blocks.11/self_attn/Unsqueeze_6" Unsqueeze )/blocks.11/self_attn/Constant_13_output_0 /blocks.11/self_attn/Constant_13"Constant*H value*<B,/blocks.11/self_attn/Constant_13_attr::valueJ  +/blocks.11/self_attn/q_norm/Cast_2_output_0 )/blocks.11/self_attn/Constant_11_output_0 )/blocks.11/self_attn/Unsqueeze_6_output_0 )/blocks.11/self_attn/Constant_10_output_0 )/blocks.11/self_attn/Constant_13_output_0#/blocks.11/self_attn/Slice_output_0/blocks.11/self_attn/Slice"Slice )/blocks.11/self_attn/Constant_14_output_0 /blocks.11/self_attn/Constant_14"Constant*H value*<B,/blocks.11/self_attn/Constant_14_attr::valueJ )/blocks.11/self_attn/Constant_15_output_0 /blocks.11/self_attn/Constant_15"Constant*H value*<B,/blocks.11/self_attn/Constant_15_attr::valueJ  $/blocks.11/self_attn/Cast_1_output_0 )/blocks.11/self_attn/Constant_15_output_0)/blocks.11/self_attn/Unsqueeze_7_output_0 /blocks.11/self_attn/Unsqueeze_7" Unsqueeze )/blocks.11/self_attn/Constant_16_output_0 /blocks.11/self_attn/Constant_16"Constant*H value*<B,/blocks.11/self_attn/Constant_16_attr::valueJ )/blocks.11/self_attn/Constant_17_output_0 /blocks.11/self_attn/Constant_17"Constant*H value*<B,/blocks.11/self_attn/Constant_17_attr::valueJ  +/blocks.11/self_attn/q_norm/Cast_2_output_0 )/blocks.11/self_attn/Unsqueeze_7_output_0 )/blocks.11/self_attn/Constant_16_output_0 )/blocks.11/self_attn/Constant_14_output_0 )/blocks.11/self_attn/Constant_17_output_0%/blocks.11/self_attn/Slice_1_output_0/blocks.11/self_attn/Slice_1"Slice i %/blocks.11/self_attn/Slice_1_output_0!/blocks.11/self_attn/Neg_output_0/blocks.11/self_attn/Neg"Neg  !/blocks.11/self_attn/Neg_output_0 #/blocks.11/self_attn/Slice_output_0&/blocks.11/self_attn/Concat_3_output_0/blocks.11/self_attn/Concat_3"Concat* axis  &/blocks.11/self_attn/Concat_3_output_0 %/blocks.0/self_attn/Gather_3_output_0#/blocks.11/self_attn/Mul_1_output_0/blocks.11/self_attn/Mul_1"Mul  !/blocks.11/self_attn/Mul_output_0 #/blocks.11/self_attn/Mul_1_output_0!/blocks.11/self_attn/Add_output_0/blocks.11/self_attn/Add"Add  +/blocks.11/self_attn/k_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0#/blocks.11/self_attn/Mul_2_output_0/blocks.11/self_attn/Mul_2"Mul y +/blocks.11/self_attn/k_norm/Cast_2_output_0%/blocks.11/self_attn/Shape_3_output_0/blocks.11/self_attn/Shape_3"Shape )/blocks.11/self_attn/Constant_18_output_0 /blocks.11/self_attn/Constant_18"Constant*F value*:B,/blocks.11/self_attn/Constant_18_attr::valueJ  %/blocks.11/self_attn/Shape_3_output_0 )/blocks.11/self_attn/Constant_18_output_0&/blocks.11/self_attn/Gather_3_output_0/blocks.11/self_attn/Gather_3"Gather* axis )/blocks.11/self_attn/Constant_19_output_0 /blocks.11/self_attn/Constant_19"Constant*F value*:B,/blocks.11/self_attn/Constant_19_attr::valueJ  &/blocks.11/self_attn/Gather_3_output_0 )/blocks.11/self_attn/Constant_19_output_0#/blocks.11/self_attn/Div_1_output_0/blocks.11/self_attn/Div_1"Div y #/blocks.11/self_attn/Div_1_output_0$/blocks.11/self_attn/Cast_2_output_0/blocks.11/self_attn/Cast_2"Cast* to z $/blocks.11/self_attn/Cast_2_output_0$/blocks.11/self_attn/Cast_3_output_0/blocks.11/self_attn/Cast_3"Cast* to )/blocks.11/self_attn/Constant_20_output_0 /blocks.11/self_attn/Constant_20"Constant*H value*<B,/blocks.11/self_attn/Constant_20_attr::valueJ )/blocks.11/self_attn/Constant_21_output_0 /blocks.11/self_attn/Constant_21"Constant*H value*<B,/blocks.11/self_attn/Constant_21_attr::valueJ )/blocks.11/self_attn/Constant_22_output_0 /blocks.11/self_attn/Constant_22"Constant*H value*<B,/blocks.11/self_attn/Constant_22_attr::valueJ  $/blocks.11/self_attn/Cast_3_output_0 )/blocks.11/self_attn/Constant_22_output_0)/blocks.11/self_attn/Unsqueeze_8_output_0 /blocks.11/self_attn/Unsqueeze_8" Unsqueeze )/blocks.11/self_attn/Constant_23_output_0 /blocks.11/self_attn/Constant_23"Constant*H value*<B,/blocks.11/self_attn/Constant_23_attr::valueJ  +/blocks.11/self_attn/k_norm/Cast_2_output_0 )/blocks.11/self_attn/Constant_21_output_0 )/blocks.11/self_attn/Unsqueeze_8_output_0 )/blocks.11/self_attn/Constant_20_output_0 )/blocks.11/self_attn/Constant_23_output_0%/blocks.11/self_attn/Slice_2_output_0/blocks.11/self_attn/Slice_2"Slice )/blocks.11/self_attn/Constant_24_output_0 /blocks.11/self_attn/Constant_24"Constant*H value*<B,/blocks.11/self_attn/Constant_24_attr::valueJ )/blocks.11/self_attn/Constant_25_output_0 /blocks.11/self_attn/Constant_25"Constant*H value*<B,/blocks.11/self_attn/Constant_25_attr::valueJ  $/blocks.11/self_attn/Cast_3_output_0 )/blocks.11/self_attn/Constant_25_output_0)/blocks.11/self_attn/Unsqueeze_9_output_0 /blocks.11/self_attn/Unsqueeze_9" Unsqueeze )/blocks.11/self_attn/Constant_26_output_0 /blocks.11/self_attn/Constant_26"Constant*H value*<B,/blocks.11/self_attn/Constant_26_attr::valueJ )/blocks.11/self_attn/Constant_27_output_0 /blocks.11/self_attn/Constant_27"Constant*H value*<B,/blocks.11/self_attn/Constant_27_attr::valueJ  +/blocks.11/self_attn/k_norm/Cast_2_output_0 )/blocks.11/self_attn/Unsqueeze_9_output_0 )/blocks.11/self_attn/Constant_26_output_0 )/blocks.11/self_attn/Constant_24_output_0 )/blocks.11/self_attn/Constant_27_output_0%/blocks.11/self_attn/Slice_3_output_0/blocks.11/self_attn/Slice_3"Slice m %/blocks.11/self_attn/Slice_3_output_0#/blocks.11/self_attn/Neg_1_output_0/blocks.11/self_attn/Neg_1"Neg  #/blocks.11/self_attn/Neg_1_output_0 %/blocks.11/self_attn/Slice_2_output_0&/blocks.11/self_attn/Concat_4_output_0/blocks.11/self_attn/Concat_4"Concat* axis  &/blocks.11/self_attn/Concat_4_output_0 %/blocks.0/self_attn/Gather_3_output_0#/blocks.11/self_attn/Mul_3_output_0/blocks.11/self_attn/Mul_3"Mul  #/blocks.11/self_attn/Mul_2_output_0 #/blocks.11/self_attn/Mul_3_output_0#/blocks.11/self_attn/Add_1_output_0/blocks.11/self_attn/Add_1"Add  /Gather_11_output_0 /rotary/Constant_3_output_0&/blocks.11/self_attn/Gather_4_output_0/blocks.11/self_attn/Gather_4"Gather* axis  /Gather_11_output_0 /rotary/Constant_8_output_0&/blocks.11/self_attn/Gather_5_output_0/blocks.11/self_attn/Gather_5"Gather* axis  &/blocks.11/self_attn/Gather_4_output_0 #/blocks.11/self_attn/Add_1_output_0&/blocks.11/self_attn/Concat_5_output_0/blocks.11/self_attn/Concat_5"Concat* axis  &/blocks.11/self_attn/Gather_5_output_0 '/blocks.11/self_attn/Reshape_2_output_0&/blocks.11/self_attn/Concat_6_output_0/blocks.11/self_attn/Concat_6"Concat* axis )/blocks.11/self_attn/Constant_28_output_0 /blocks.11/self_attn/Constant_28"Constant*H value*<B,/blocks.11/self_attn/Constant_28_attr::valueJ  &/blocks.11/self_attn/Concat_5_output_0 )/blocks.11/self_attn/Constant_28_output_0*/blocks.11/self_attn/Unsqueeze_10_output_0!/blocks.11/self_attn/Unsqueeze_10" Unsqueeze )/blocks.11/self_attn/Constant_29_output_0 /blocks.11/self_attn/Constant_29"Constant*H value*<B,/blocks.11/self_attn/Constant_29_attr::valueJ  &/blocks.11/self_attn/Concat_6_output_0 )/blocks.11/self_attn/Constant_29_output_0*/blocks.11/self_attn/Unsqueeze_11_output_0!/blocks.11/self_attn/Unsqueeze_11" Unsqueeze  */blocks.11/self_attn/Unsqueeze_10_output_0 */blocks.11/self_attn/Unsqueeze_11_output_0&/blocks.11/self_attn/Concat_7_output_0/blocks.11/self_attn/Concat_7"Concat* axis  !/blocks.11/self_attn/Add_output_0'/blocks.11/self_attn/Transpose_output_0/blocks.11/self_attn/Transpose" Transpose* perm@@@@  &/blocks.11/self_attn/Concat_5_output_0)/blocks.11/self_attn/Transpose_1_output_0 /blocks.11/self_attn/Transpose_1" Transpose* perm@@@@  &/blocks.11/self_attn/Concat_6_output_0)/blocks.11/self_attn/Transpose_2_output_0 /blocks.11/self_attn/Transpose_2" Transpose* perm@@@@ w )/blocks.11/self_attn/Transpose_1_output_0%/blocks.11/self_attn/Shape_4_output_0/blocks.11/self_attn/Shape_4"Shape )/blocks.11/self_attn/Constant_30_output_0 /blocks.11/self_attn/Constant_30"Constant*F value*:B,/blocks.11/self_attn/Constant_30_attr::valueJ  %/blocks.11/self_attn/Shape_4_output_0 )/blocks.11/self_attn/Constant_30_output_0&/blocks.11/self_attn/Gather_6_output_0/blocks.11/self_attn/Gather_6"Gather* axis w )/blocks.11/self_attn/Transpose_1_output_0%/blocks.11/self_attn/Shape_5_output_0/blocks.11/self_attn/Shape_5"Shape )/blocks.11/self_attn/Constant_31_output_0 /blocks.11/self_attn/Constant_31"Constant*F value*:B,/blocks.11/self_attn/Constant_31_attr::valueJ  %/blocks.11/self_attn/Shape_5_output_0 )/blocks.11/self_attn/Constant_31_output_0&/blocks.11/self_attn/Gather_7_output_0/blocks.11/self_attn/Gather_7"Gather* axis w )/blocks.11/self_attn/Transpose_1_output_0%/blocks.11/self_attn/Shape_6_output_0/blocks.11/self_attn/Shape_6"Shape )/blocks.11/self_attn/Constant_32_output_0 /blocks.11/self_attn/Constant_32"Constant*F value*:B,/blocks.11/self_attn/Constant_32_attr::valueJ  %/blocks.11/self_attn/Shape_6_output_0 )/blocks.11/self_attn/Constant_32_output_0&/blocks.11/self_attn/Gather_8_output_0/blocks.11/self_attn/Gather_8"Gather* axis w )/blocks.11/self_attn/Transpose_1_output_0%/blocks.11/self_attn/Shape_7_output_0/blocks.11/self_attn/Shape_7"Shape )/blocks.11/self_attn/Constant_33_output_0 /blocks.11/self_attn/Constant_33"Constant*F value*:B,/blocks.11/self_attn/Constant_33_attr::valueJ  %/blocks.11/self_attn/Shape_7_output_0 )/blocks.11/self_attn/Constant_33_output_0&/blocks.11/self_attn/Gather_9_output_0/blocks.11/self_attn/Gather_9"Gather* axis )/blocks.11/self_attn/Constant_34_output_0 /blocks.11/self_attn/Constant_34"Constant*H value*<B,/blocks.11/self_attn/Constant_34_attr::valueJ  )/blocks.11/self_attn/Transpose_1_output_0 )/blocks.11/self_attn/Constant_34_output_0*/blocks.11/self_attn/Unsqueeze_12_output_0!/blocks.11/self_attn/Unsqueeze_12" Unsqueeze )/blocks.11/self_attn/Constant_35_output_0 /blocks.11/self_attn/Constant_35"Constant*H value*<B,/blocks.11/self_attn/Constant_35_attr::valueJ  &/blocks.11/self_attn/Gather_6_output_0 )/blocks.11/self_attn/Constant_35_output_0*/blocks.11/self_attn/Unsqueeze_13_output_0!/blocks.11/self_attn/Unsqueeze_13" Unsqueeze )/blocks.11/self_attn/Constant_36_output_0 /blocks.11/self_attn/Constant_36"Constant*H value*<B,/blocks.11/self_attn/Constant_36_attr::valueJ  &/blocks.11/self_attn/Gather_7_output_0 )/blocks.11/self_attn/Constant_36_output_0*/blocks.11/self_attn/Unsqueeze_14_output_0!/blocks.11/self_attn/Unsqueeze_14" Unsqueeze )/blocks.11/self_attn/Constant_37_output_0 /blocks.11/self_attn/Constant_37"Constant*H value*<B,/blocks.11/self_attn/Constant_37_attr::valueJ )/blocks.11/self_attn/Constant_38_output_0 /blocks.11/self_attn/Constant_38"Constant*H value*<B,/blocks.11/self_attn/Constant_38_attr::valueJ  &/blocks.11/self_attn/Gather_8_output_0 )/blocks.11/self_attn/Constant_38_output_0*/blocks.11/self_attn/Unsqueeze_15_output_0!/blocks.11/self_attn/Unsqueeze_15" Unsqueeze )/blocks.11/self_attn/Constant_39_output_0 /blocks.11/self_attn/Constant_39"Constant*H value*<B,/blocks.11/self_attn/Constant_39_attr::valueJ  &/blocks.11/self_attn/Gather_9_output_0 )/blocks.11/self_attn/Constant_39_output_0*/blocks.11/self_attn/Unsqueeze_16_output_0!/blocks.11/self_attn/Unsqueeze_16" Unsqueeze  */blocks.11/self_attn/Unsqueeze_13_output_0 */blocks.11/self_attn/Unsqueeze_14_output_0 )/blocks.11/self_attn/Constant_37_output_0 */blocks.11/self_attn/Unsqueeze_15_output_0 */blocks.11/self_attn/Unsqueeze_16_output_0&/blocks.11/self_attn/Concat_8_output_0/blocks.11/self_attn/Concat_8"Concat* axis )/blocks.11/self_attn/Constant_40_output_0 /blocks.11/self_attn/Constant_40"Constant*H value*<B,/blocks.11/self_attn/Constant_40_attr::valueJ  &/blocks.11/self_attn/Concat_8_output_0 )/blocks.11/self_attn/Constant_40_output_0'/blocks.11/self_attn/Reshape_3_output_0/blocks.11/self_attn/Reshape_3"Reshape* allowzero u '/blocks.11/self_attn/Reshape_3_output_0%/blocks.11/self_attn/Shape_8_output_0/blocks.11/self_attn/Shape_8"Shape  %/blocks.11/self_attn/Shape_8_output_0-/blocks.11/self_attn/ConstantOfShape_output_0$/blocks.11/self_attn/ConstantOfShape"ConstantOfShape*L value*@B0/blocks.11/self_attn/ConstantOfShape_attr::valueJ )/blocks.11/self_attn/Constant_41_output_0 /blocks.11/self_attn/Constant_41"Constant*F value*:B,/blocks.11/self_attn/Constant_41_attr::valueJ  -/blocks.11/self_attn/ConstantOfShape_output_0 )/blocks.11/self_attn/Constant_41_output_0#/blocks.11/self_attn/Mul_4_output_0/blocks.11/self_attn/Mul_4"Mul  '/blocks.11/self_attn/Reshape_3_output_0 #/blocks.11/self_attn/Mul_4_output_0#/blocks.11/self_attn/Equal_output_0/blocks.11/self_attn/Equal"Equal  #/blocks.11/self_attn/Equal_output_0 -/blocks.11/self_attn/ConstantOfShape_output_0 '/blocks.11/self_attn/Reshape_3_output_0#/blocks.11/self_attn/Where_output_0/blocks.11/self_attn/Where"Where  */blocks.11/self_attn/Unsqueeze_12_output_0 #/blocks.11/self_attn/Where_output_0$/blocks.11/self_attn/Expand_output_0/blocks.11/self_attn/Expand"Expand )/blocks.11/self_attn/Constant_42_output_0 /blocks.11/self_attn/Constant_42"Constant*F value*:B,/blocks.11/self_attn/Constant_42_attr::valueJ  &/blocks.11/self_attn/Gather_7_output_0 )/blocks.11/self_attn/Constant_42_output_0#/blocks.11/self_attn/Mul_5_output_0/blocks.11/self_attn/Mul_5"Mul fonnx::Unsqueeze_3733 Constant_5588"Constant*5 value*)BConstant_5588_attr::valueJ  &/blocks.11/self_attn/Gather_6_output_0 onnx::Unsqueeze_3733*/blocks.11/self_attn/Unsqueeze_17_output_0!/blocks.11/self_attn/Unsqueeze_17" Unsqueeze fonnx::Unsqueeze_3735 Constant_5590"Constant*5 value*)BConstant_5590_attr::valueJ  #/blocks.11/self_attn/Mul_5_output_0 onnx::Unsqueeze_3735*/blocks.11/self_attn/Unsqueeze_18_output_0!/blocks.11/self_attn/Unsqueeze_18" Unsqueeze fonnx::Unsqueeze_3737 Constant_5592"Constant*5 value*)BConstant_5592_attr::valueJ  &/blocks.11/self_attn/Gather_8_output_0 onnx::Unsqueeze_3737*/blocks.11/self_attn/Unsqueeze_19_output_0!/blocks.11/self_attn/Unsqueeze_19" Unsqueeze fonnx::Unsqueeze_3739 Constant_5594"Constant*5 value*)BConstant_5594_attr::valueJ  &/blocks.11/self_attn/Gather_9_output_0 onnx::Unsqueeze_3739*/blocks.11/self_attn/Unsqueeze_20_output_0!/blocks.11/self_attn/Unsqueeze_20" Unsqueeze  */blocks.11/self_attn/Unsqueeze_17_output_0 */blocks.11/self_attn/Unsqueeze_18_output_0 */blocks.11/self_attn/Unsqueeze_19_output_0 */blocks.11/self_attn/Unsqueeze_20_output_0&/blocks.11/self_attn/Concat_9_output_0/blocks.11/self_attn/Concat_9"Concat* axis  $/blocks.11/self_attn/Expand_output_0 &/blocks.11/self_attn/Concat_9_output_0'/blocks.11/self_attn/Reshape_4_output_0/blocks.11/self_attn/Reshape_4"Reshape* allowzero w )/blocks.11/self_attn/Transpose_2_output_0%/blocks.11/self_attn/Shape_9_output_0/blocks.11/self_attn/Shape_9"Shape )/blocks.11/self_attn/Constant_43_output_0 /blocks.11/self_attn/Constant_43"Constant*F value*:B,/blocks.11/self_attn/Constant_43_attr::valueJ  %/blocks.11/self_attn/Shape_9_output_0 )/blocks.11/self_attn/Constant_43_output_0'/blocks.11/self_attn/Gather_10_output_0/blocks.11/self_attn/Gather_10"Gather* axis y )/blocks.11/self_attn/Transpose_2_output_0&/blocks.11/self_attn/Shape_10_output_0/blocks.11/self_attn/Shape_10"Shape )/blocks.11/self_attn/Constant_44_output_0 /blocks.11/self_attn/Constant_44"Constant*F value*:B,/blocks.11/self_attn/Constant_44_attr::valueJ  &/blocks.11/self_attn/Shape_10_output_0 )/blocks.11/self_attn/Constant_44_output_0'/blocks.11/self_attn/Gather_11_output_0/blocks.11/self_attn/Gather_11"Gather* axis y )/blocks.11/self_attn/Transpose_2_output_0&/blocks.11/self_attn/Shape_11_output_0/blocks.11/self_attn/Shape_11"Shape )/blocks.11/self_attn/Constant_45_output_0 /blocks.11/self_attn/Constant_45"Constant*F value*:B,/blocks.11/self_attn/Constant_45_attr::valueJ  &/blocks.11/self_attn/Shape_11_output_0 )/blocks.11/self_attn/Constant_45_output_0'/blocks.11/self_attn/Gather_12_output_0/blocks.11/self_attn/Gather_12"Gather* axis y )/blocks.11/self_attn/Transpose_2_output_0&/blocks.11/self_attn/Shape_12_output_0/blocks.11/self_attn/Shape_12"Shape )/blocks.11/self_attn/Constant_46_output_0 /blocks.11/self_attn/Constant_46"Constant*F value*:B,/blocks.11/self_attn/Constant_46_attr::valueJ  &/blocks.11/self_attn/Shape_12_output_0 )/blocks.11/self_attn/Constant_46_output_0'/blocks.11/self_attn/Gather_13_output_0/blocks.11/self_attn/Gather_13"Gather* axis )/blocks.11/self_attn/Constant_47_output_0 /blocks.11/self_attn/Constant_47"Constant*H value*<B,/blocks.11/self_attn/Constant_47_attr::valueJ  )/blocks.11/self_attn/Transpose_2_output_0 )/blocks.11/self_attn/Constant_47_output_0*/blocks.11/self_attn/Unsqueeze_21_output_0!/blocks.11/self_attn/Unsqueeze_21" Unsqueeze )/blocks.11/self_attn/Constant_48_output_0 /blocks.11/self_attn/Constant_48"Constant*H value*<B,/blocks.11/self_attn/Constant_48_attr::valueJ  '/blocks.11/self_attn/Gather_10_output_0 )/blocks.11/self_attn/Constant_48_output_0*/blocks.11/self_attn/Unsqueeze_22_output_0!/blocks.11/self_attn/Unsqueeze_22" Unsqueeze )/blocks.11/self_attn/Constant_49_output_0 /blocks.11/self_attn/Constant_49"Constant*H value*<B,/blocks.11/self_attn/Constant_49_attr::valueJ  '/blocks.11/self_attn/Gather_11_output_0 )/blocks.11/self_attn/Constant_49_output_0*/blocks.11/self_attn/Unsqueeze_23_output_0!/blocks.11/self_attn/Unsqueeze_23" Unsqueeze )/blocks.11/self_attn/Constant_50_output_0 /blocks.11/self_attn/Constant_50"Constant*H value*<B,/blocks.11/self_attn/Constant_50_attr::valueJ )/blocks.11/self_attn/Constant_51_output_0 /blocks.11/self_attn/Constant_51"Constant*H value*<B,/blocks.11/self_attn/Constant_51_attr::valueJ  '/blocks.11/self_attn/Gather_12_output_0 )/blocks.11/self_attn/Constant_51_output_0*/blocks.11/self_attn/Unsqueeze_24_output_0!/blocks.11/self_attn/Unsqueeze_24" Unsqueeze )/blocks.11/self_attn/Constant_52_output_0 /blocks.11/self_attn/Constant_52"Constant*H value*<B,/blocks.11/self_attn/Constant_52_attr::valueJ  '/blocks.11/self_attn/Gather_13_output_0 )/blocks.11/self_attn/Constant_52_output_0*/blocks.11/self_attn/Unsqueeze_25_output_0!/blocks.11/self_attn/Unsqueeze_25" Unsqueeze  */blocks.11/self_attn/Unsqueeze_22_output_0 */blocks.11/self_attn/Unsqueeze_23_output_0 )/blocks.11/self_attn/Constant_50_output_0 */blocks.11/self_attn/Unsqueeze_24_output_0 */blocks.11/self_attn/Unsqueeze_25_output_0'/blocks.11/self_attn/Concat_10_output_0/blocks.11/self_attn/Concat_10"Concat* axis )/blocks.11/self_attn/Constant_53_output_0 /blocks.11/self_attn/Constant_53"Constant*H value*<B,/blocks.11/self_attn/Constant_53_attr::valueJ  '/blocks.11/self_attn/Concat_10_output_0 )/blocks.11/self_attn/Constant_53_output_0'/blocks.11/self_attn/Reshape_5_output_0/blocks.11/self_attn/Reshape_5"Reshape* allowzero w '/blocks.11/self_attn/Reshape_5_output_0&/blocks.11/self_attn/Shape_13_output_0/blocks.11/self_attn/Shape_13"Shape  &/blocks.11/self_attn/Shape_13_output_0//blocks.11/self_attn/ConstantOfShape_1_output_0&/blocks.11/self_attn/ConstantOfShape_1"ConstantOfShape*N value*BB2/blocks.11/self_attn/ConstantOfShape_1_attr::valueJ )/blocks.11/self_attn/Constant_54_output_0 /blocks.11/self_attn/Constant_54"Constant*F value*:B,/blocks.11/self_attn/Constant_54_attr::valueJ  //blocks.11/self_attn/ConstantOfShape_1_output_0 )/blocks.11/self_attn/Constant_54_output_0#/blocks.11/self_attn/Mul_6_output_0/blocks.11/self_attn/Mul_6"Mul  '/blocks.11/self_attn/Reshape_5_output_0 #/blocks.11/self_attn/Mul_6_output_0%/blocks.11/self_attn/Equal_1_output_0/blocks.11/self_attn/Equal_1"Equal  %/blocks.11/self_attn/Equal_1_output_0 //blocks.11/self_attn/ConstantOfShape_1_output_0 '/blocks.11/self_attn/Reshape_5_output_0%/blocks.11/self_attn/Where_1_output_0/blocks.11/self_attn/Where_1"Where  */blocks.11/self_attn/Unsqueeze_21_output_0 %/blocks.11/self_attn/Where_1_output_0&/blocks.11/self_attn/Expand_1_output_0/blocks.11/self_attn/Expand_1"Expand )/blocks.11/self_attn/Constant_55_output_0 /blocks.11/self_attn/Constant_55"Constant*F value*:B,/blocks.11/self_attn/Constant_55_attr::valueJ  '/blocks.11/self_attn/Gather_11_output_0 )/blocks.11/self_attn/Constant_55_output_0#/blocks.11/self_attn/Mul_7_output_0/blocks.11/self_attn/Mul_7"Mul fonnx::Unsqueeze_3779 Constant_5633"Constant*5 value*)BConstant_5633_attr::valueJ  '/blocks.11/self_attn/Gather_10_output_0 onnx::Unsqueeze_3779*/blocks.11/self_attn/Unsqueeze_26_output_0!/blocks.11/self_attn/Unsqueeze_26" Unsqueeze fonnx::Unsqueeze_3781 Constant_5635"Constant*5 value*)BConstant_5635_attr::valueJ  #/blocks.11/self_attn/Mul_7_output_0 onnx::Unsqueeze_3781*/blocks.11/self_attn/Unsqueeze_27_output_0!/blocks.11/self_attn/Unsqueeze_27" Unsqueeze fonnx::Unsqueeze_3783 Constant_5637"Constant*5 value*)BConstant_5637_attr::valueJ  '/blocks.11/self_attn/Gather_12_output_0 onnx::Unsqueeze_3783*/blocks.11/self_attn/Unsqueeze_28_output_0!/blocks.11/self_attn/Unsqueeze_28" Unsqueeze fonnx::Unsqueeze_3785 Constant_5639"Constant*5 value*)BConstant_5639_attr::valueJ  '/blocks.11/self_attn/Gather_13_output_0 onnx::Unsqueeze_3785*/blocks.11/self_attn/Unsqueeze_29_output_0!/blocks.11/self_attn/Unsqueeze_29" Unsqueeze  */blocks.11/self_attn/Unsqueeze_26_output_0 */blocks.11/self_attn/Unsqueeze_27_output_0 */blocks.11/self_attn/Unsqueeze_28_output_0 */blocks.11/self_attn/Unsqueeze_29_output_0'/blocks.11/self_attn/Concat_11_output_0/blocks.11/self_attn/Concat_11"Concat* axis  &/blocks.11/self_attn/Expand_1_output_0 '/blocks.11/self_attn/Concat_11_output_0'/blocks.11/self_attn/Reshape_6_output_0/blocks.11/self_attn/Reshape_6"Reshape* allowzero  '/blocks.11/self_attn/Transpose_output_0 '/blocks.11/self_attn/Reshape_4_output_0$/blocks.11/self_attn/MatMul_output_0/blocks.11/self_attn/MatMul"MatMul )/blocks.11/self_attn/Constant_56_output_0 /blocks.11/self_attn/Constant_56"Constant*B value*6B,/blocks.11/self_attn/Constant_56_attr::valueJ5A  $/blocks.11/self_attn/MatMul_output_0 )/blocks.11/self_attn/Constant_56_output_0#/blocks.11/self_attn/Div_2_output_0/blocks.11/self_attn/Div_2"Div { #/blocks.11/self_attn/Div_2_output_0 attention_mask#/blocks.11/self_attn/Add_2_output_0/blocks.11/self_attn/Add_2"Add  #/blocks.11/self_attn/Add_2_output_0%/blocks.11/self_attn/Softmax_output_0/blocks.11/self_attn/Softmax"Softmax* axis { %/blocks.11/self_attn/Softmax_output_0$/blocks.11/self_attn/Cast_4_output_0/blocks.11/self_attn/Cast_4"Cast* to  $/blocks.11/self_attn/Cast_4_output_0 '/blocks.11/self_attn/Reshape_6_output_0&/blocks.11/self_attn/MatMul_1_output_0/blocks.11/self_attn/MatMul_1"MatMul  &/blocks.11/self_attn/MatMul_1_output_0)/blocks.11/self_attn/Transpose_3_output_0 /blocks.11/self_attn/Transpose_3" Transpose* perm@@@@ fonnx::Unsqueeze_3797 Constant_5651"Constant*5 value*)BConstant_5651_attr::valueJ  $/blocks.11/self_attn/Gather_output_0 onnx::Unsqueeze_3797*/blocks.11/self_attn/Unsqueeze_30_output_0!/blocks.11/self_attn/Unsqueeze_30" Unsqueeze fonnx::Unsqueeze_3799 Constant_5653"Constant*5 value*)BConstant_5653_attr::valueJ  &/blocks.11/self_attn/Gather_1_output_0 onnx::Unsqueeze_3799*/blocks.11/self_attn/Unsqueeze_31_output_0!/blocks.11/self_attn/Unsqueeze_31" Unsqueeze )/blocks.11/self_attn/Constant_57_output_0 /blocks.11/self_attn/Constant_57"Constant*H value*<B,/blocks.11/self_attn/Constant_57_attr::valueJ  */blocks.11/self_attn/Unsqueeze_30_output_0 */blocks.11/self_attn/Unsqueeze_31_output_0 )/blocks.11/self_attn/Constant_57_output_0'/blocks.11/self_attn/Concat_12_output_0/blocks.11/self_attn/Concat_12"Concat* axis  )/blocks.11/self_attn/Transpose_3_output_0 '/blocks.11/self_attn/Concat_12_output_0'/blocks.11/self_attn/Reshape_7_output_0/blocks.11/self_attn/Reshape_7"Reshape* allowzero  '/blocks.11/self_attn/Reshape_7_output_0 onnx::MatMul_8897+/blocks.11/self_attn/o_proj/MatMul_output_0"/blocks.11/self_attn/o_proj/MatMul"MatMul  */blocks.11/input_layernorm/Cast_1_output_0 +/blocks.11/self_attn/o_proj/MatMul_output_0/blocks.11/Add_output_0/blocks.11/Add"Add  /blocks.11/Add_output_01/blocks.11/post_attention_layernorm/Cast_output_0(/blocks.11/post_attention_layernorm/Cast"Cast* to 5/blocks.11/post_attention_layernorm/Constant_output_0,/blocks.11/post_attention_layernorm/Constant"Constant*N value*BB8/blocks.11/post_attention_layernorm/Constant_attr::valueJ@  1/blocks.11/post_attention_layernorm/Cast_output_0 5/blocks.11/post_attention_layernorm/Constant_output_00/blocks.11/post_attention_layernorm/Pow_output_0'/blocks.11/post_attention_layernorm/Pow"Pow  0/blocks.11/post_attention_layernorm/Pow_output_07/blocks.11/post_attention_layernorm/ReduceMean_output_0./blocks.11/post_attention_layernorm/ReduceMean" ReduceMean* axes@* keepdims 7/blocks.11/post_attention_layernorm/Constant_1_output_0./blocks.11/post_attention_layernorm/Constant_1"Constant*P value*DB:/blocks.11/post_attention_layernorm/Constant_1_attr::valueJ75  7/blocks.11/post_attention_layernorm/ReduceMean_output_0 7/blocks.11/post_attention_layernorm/Constant_1_output_00/blocks.11/post_attention_layernorm/Add_output_0'/blocks.11/post_attention_layernorm/Add"Add  0/blocks.11/post_attention_layernorm/Add_output_01/blocks.11/post_attention_layernorm/Sqrt_output_0(/blocks.11/post_attention_layernorm/Sqrt"Sqrt 7/blocks.11/post_attention_layernorm/Constant_2_output_0./blocks.11/post_attention_layernorm/Constant_2"Constant*P value*DB:/blocks.11/post_attention_layernorm/Constant_2_attr::valueJ?  7/blocks.11/post_attention_layernorm/Constant_2_output_0 1/blocks.11/post_attention_layernorm/Sqrt_output_00/blocks.11/post_attention_layernorm/Div_output_0'/blocks.11/post_attention_layernorm/Div"Div  1/blocks.11/post_attention_layernorm/Cast_output_03/blocks.11/post_attention_layernorm/Cast_1_output_0*/blocks.11/post_attention_layernorm/Cast_1"Cast* to  3/blocks.11/post_attention_layernorm/Cast_1_output_0 0/blocks.11/post_attention_layernorm/Div_output_00/blocks.11/post_attention_layernorm/Mul_output_0'/blocks.11/post_attention_layernorm/Mul"Mul  0/blocks.11/post_attention_layernorm/Mul_output_0 )blocks.11.post_attention_layernorm.weight2/blocks.11/post_attention_layernorm/Mul_1_output_0)/blocks.11/post_attention_layernorm/Mul_1"Mul  2/blocks.11/post_attention_layernorm/Mul_1_output_03/blocks.11/post_attention_layernorm/Cast_2_output_0*/blocks.11/post_attention_layernorm/Cast_2"Cast* to  3/blocks.11/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_8898(/blocks.11/mlp/gate_proj/MatMul_output_0/blocks.11/mlp/gate_proj/MatMul"MatMul z (/blocks.11/mlp/gate_proj/MatMul_output_0&/blocks.11/mlp/act_fn/Sigmoid_output_0/blocks.11/mlp/act_fn/Sigmoid"Sigmoid  (/blocks.11/mlp/gate_proj/MatMul_output_0 &/blocks.11/mlp/act_fn/Sigmoid_output_0"/blocks.11/mlp/act_fn/Mul_output_0/blocks.11/mlp/act_fn/Mul"Mul  3/blocks.11/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_8899&/blocks.11/mlp/up_proj/MatMul_output_0/blocks.11/mlp/up_proj/MatMul"MatMul  "/blocks.11/mlp/act_fn/Mul_output_0 &/blocks.11/mlp/up_proj/MatMul_output_0/blocks.11/mlp/Mul_output_0/blocks.11/mlp/Mul"Mul  /blocks.11/mlp/Mul_output_0 onnx::MatMul_8900(/blocks.11/mlp/down_proj/MatMul_output_0/blocks.11/mlp/down_proj/MatMul"MatMul  3/blocks.11/post_attention_layernorm/Cast_1_output_0 (/blocks.11/mlp/down_proj/MatMul_output_0/blocks.11/Add_1_output_0/blocks.11/Add_1"Add `/Constant_5_output_0 /Constant_5"Constant*1 value*%B/Constant_5_attr::valueJ  ] past_key_values /Constant_5_output_0/Gather_12_output_0 /Gather_12"Gather* axis /blocks.12/Constant_output_0/blocks.12/Constant"Constant*K value*?B/blocks.12/Constant_attr::valueJ  /blocks.11/Add_1_output_0 /blocks.12/Constant_output_0/blocks.12/Reshape_output_0/blocks.12/Reshape"Reshape* allowzero y /blocks.12/Reshape_output_0(/blocks.12/input_layernorm/Cast_output_0/blocks.12/input_layernorm/Cast"Cast* to ,/blocks.12/input_layernorm/Constant_output_0#/blocks.12/input_layernorm/Constant"Constant*E value*9B//blocks.12/input_layernorm/Constant_attr::valueJ@  (/blocks.12/input_layernorm/Cast_output_0 ,/blocks.12/input_layernorm/Constant_output_0'/blocks.12/input_layernorm/Pow_output_0/blocks.12/input_layernorm/Pow"Pow  '/blocks.12/input_layernorm/Pow_output_0./blocks.12/input_layernorm/ReduceMean_output_0%/blocks.12/input_layernorm/ReduceMean" ReduceMean* axes@* keepdims ./blocks.12/input_layernorm/Constant_1_output_0%/blocks.12/input_layernorm/Constant_1"Constant*G value*;B1/blocks.12/input_layernorm/Constant_1_attr::valueJ75  ./blocks.12/input_layernorm/ReduceMean_output_0 ./blocks.12/input_layernorm/Constant_1_output_0'/blocks.12/input_layernorm/Add_output_0/blocks.12/input_layernorm/Add"Add z '/blocks.12/input_layernorm/Add_output_0(/blocks.12/input_layernorm/Sqrt_output_0/blocks.12/input_layernorm/Sqrt"Sqrt ./blocks.12/input_layernorm/Constant_2_output_0%/blocks.12/input_layernorm/Constant_2"Constant*G value*;B1/blocks.12/input_layernorm/Constant_2_attr::valueJ?  ./blocks.12/input_layernorm/Constant_2_output_0 (/blocks.12/input_layernorm/Sqrt_output_0'/blocks.12/input_layernorm/Div_output_0/blocks.12/input_layernorm/Div"Div  (/blocks.12/input_layernorm/Cast_output_0*/blocks.12/input_layernorm/Cast_1_output_0!/blocks.12/input_layernorm/Cast_1"Cast* to  */blocks.12/input_layernorm/Cast_1_output_0 '/blocks.12/input_layernorm/Div_output_0'/blocks.12/input_layernorm/Mul_output_0/blocks.12/input_layernorm/Mul"Mul  '/blocks.12/input_layernorm/Mul_output_0 blocks.12.input_layernorm.weight)/blocks.12/input_layernorm/Mul_1_output_0 /blocks.12/input_layernorm/Mul_1"Mul  )/blocks.12/input_layernorm/Mul_1_output_0*/blocks.12/input_layernorm/Cast_2_output_0!/blocks.12/input_layernorm/Cast_2"Cast* to t */blocks.12/input_layernorm/Cast_2_output_0#/blocks.12/self_attn/Shape_output_0/blocks.12/self_attn/Shape"Shape &/blocks.12/self_attn/Constant_output_0/blocks.12/self_attn/Constant"Constant*C value*7B)/blocks.12/self_attn/Constant_attr::valueJ  #/blocks.12/self_attn/Shape_output_0 &/blocks.12/self_attn/Constant_output_0$/blocks.12/self_attn/Gather_output_0/blocks.12/self_attn/Gather"Gather* axis x */blocks.12/input_layernorm/Cast_2_output_0%/blocks.12/self_attn/Shape_1_output_0/blocks.12/self_attn/Shape_1"Shape (/blocks.12/self_attn/Constant_1_output_0/blocks.12/self_attn/Constant_1"Constant*E value*9B+/blocks.12/self_attn/Constant_1_attr::valueJ  %/blocks.12/self_attn/Shape_1_output_0 (/blocks.12/self_attn/Constant_1_output_0&/blocks.12/self_attn/Gather_1_output_0/blocks.12/self_attn/Gather_1"Gather* axis  */blocks.12/input_layernorm/Cast_2_output_0 onnx::MatMul_8901+/blocks.12/self_attn/q_proj/MatMul_output_0"/blocks.12/self_attn/q_proj/MatMul"MatMul  */blocks.12/input_layernorm/Cast_2_output_0 onnx::MatMul_8902+/blocks.12/self_attn/k_proj/MatMul_output_0"/blocks.12/self_attn/k_proj/MatMul"MatMul  */blocks.12/input_layernorm/Cast_2_output_0 onnx::MatMul_8903+/blocks.12/self_attn/v_proj/MatMul_output_0"/blocks.12/self_attn/v_proj/MatMul"MatMul fonnx::Unsqueeze_3860 Constant_5706"Constant*5 value*)BConstant_5706_attr::valueJ  $/blocks.12/self_attn/Gather_output_0 onnx::Unsqueeze_3860'/blocks.12/self_attn/Unsqueeze_output_0/blocks.12/self_attn/Unsqueeze" Unsqueeze fonnx::Unsqueeze_3862 Constant_5708"Constant*5 value*)BConstant_5708_attr::valueJ  &/blocks.12/self_attn/Gather_1_output_0 onnx::Unsqueeze_3862)/blocks.12/self_attn/Unsqueeze_1_output_0 /blocks.12/self_attn/Unsqueeze_1" Unsqueeze (/blocks.12/self_attn/Constant_2_output_0/blocks.12/self_attn/Constant_2"Constant*G value*;B+/blocks.12/self_attn/Constant_2_attr::valueJ (/blocks.12/self_attn/Constant_3_output_0/blocks.12/self_attn/Constant_3"Constant*G value*;B+/blocks.12/self_attn/Constant_3_attr::valueJ  '/blocks.12/self_attn/Unsqueeze_output_0 )/blocks.12/self_attn/Unsqueeze_1_output_0 (/blocks.12/self_attn/Constant_2_output_0 (/blocks.12/self_attn/Constant_3_output_0$/blocks.12/self_attn/Concat_output_0/blocks.12/self_attn/Concat"Concat* axis  +/blocks.12/self_attn/q_proj/MatMul_output_0 $/blocks.12/self_attn/Concat_output_0%/blocks.12/self_attn/Reshape_output_0/blocks.12/self_attn/Reshape"Reshape* allowzero fonnx::Unsqueeze_3870 Constant_5714"Constant*5 value*)BConstant_5714_attr::valueJ  $/blocks.12/self_attn/Gather_output_0 onnx::Unsqueeze_3870)/blocks.12/self_attn/Unsqueeze_2_output_0 /blocks.12/self_attn/Unsqueeze_2" Unsqueeze fonnx::Unsqueeze_3872 Constant_5716"Constant*5 value*)BConstant_5716_attr::valueJ  &/blocks.12/self_attn/Gather_1_output_0 onnx::Unsqueeze_3872)/blocks.12/self_attn/Unsqueeze_3_output_0 /blocks.12/self_attn/Unsqueeze_3" Unsqueeze (/blocks.12/self_attn/Constant_4_output_0/blocks.12/self_attn/Constant_4"Constant*G value*;B+/blocks.12/self_attn/Constant_4_attr::valueJ (/blocks.12/self_attn/Constant_5_output_0/blocks.12/self_attn/Constant_5"Constant*G value*;B+/blocks.12/self_attn/Constant_5_attr::valueJ  )/blocks.12/self_attn/Unsqueeze_2_output_0 )/blocks.12/self_attn/Unsqueeze_3_output_0 (/blocks.12/self_attn/Constant_4_output_0 (/blocks.12/self_attn/Constant_5_output_0&/blocks.12/self_attn/Concat_1_output_0/blocks.12/self_attn/Concat_1"Concat* axis fonnx::Unsqueeze_3879 Constant_5721"Constant*5 value*)BConstant_5721_attr::valueJ  $/blocks.12/self_attn/Gather_output_0 onnx::Unsqueeze_3879)/blocks.12/self_attn/Unsqueeze_4_output_0 /blocks.12/self_attn/Unsqueeze_4" Unsqueeze fonnx::Unsqueeze_3881 Constant_5723"Constant*5 value*)BConstant_5723_attr::valueJ  &/blocks.12/self_attn/Gather_1_output_0 onnx::Unsqueeze_3881)/blocks.12/self_attn/Unsqueeze_5_output_0 /blocks.12/self_attn/Unsqueeze_5" Unsqueeze (/blocks.12/self_attn/Constant_6_output_0/blocks.12/self_attn/Constant_6"Constant*G value*;B+/blocks.12/self_attn/Constant_6_attr::valueJ (/blocks.12/self_attn/Constant_7_output_0/blocks.12/self_attn/Constant_7"Constant*G value*;B+/blocks.12/self_attn/Constant_7_attr::valueJ  )/blocks.12/self_attn/Unsqueeze_4_output_0 )/blocks.12/self_attn/Unsqueeze_5_output_0 (/blocks.12/self_attn/Constant_6_output_0 (/blocks.12/self_attn/Constant_7_output_0&/blocks.12/self_attn/Concat_2_output_0/blocks.12/self_attn/Concat_2"Concat* axis  +/blocks.12/self_attn/k_proj/MatMul_output_0 &/blocks.12/self_attn/Concat_1_output_0'/blocks.12/self_attn/Reshape_1_output_0/blocks.12/self_attn/Reshape_1"Reshape* allowzero  +/blocks.12/self_attn/v_proj/MatMul_output_0 &/blocks.12/self_attn/Concat_2_output_0'/blocks.12/self_attn/Reshape_2_output_0/blocks.12/self_attn/Reshape_2"Reshape* allowzero  %/blocks.12/self_attn/Reshape_output_0)/blocks.12/self_attn/q_norm/Cast_output_0 /blocks.12/self_attn/q_norm/Cast"Cast* to -/blocks.12/self_attn/q_norm/Constant_output_0$/blocks.12/self_attn/q_norm/Constant"Constant*F value*:B0/blocks.12/self_attn/q_norm/Constant_attr::valueJ@  )/blocks.12/self_attn/q_norm/Cast_output_0 -/blocks.12/self_attn/q_norm/Constant_output_0(/blocks.12/self_attn/q_norm/Pow_output_0/blocks.12/self_attn/q_norm/Pow"Pow  (/blocks.12/self_attn/q_norm/Pow_output_0//blocks.12/self_attn/q_norm/ReduceMean_output_0&/blocks.12/self_attn/q_norm/ReduceMean" ReduceMean* axes@* keepdims //blocks.12/self_attn/q_norm/Constant_1_output_0&/blocks.12/self_attn/q_norm/Constant_1"Constant*H value*<B2/blocks.12/self_attn/q_norm/Constant_1_attr::valueJ75  //blocks.12/self_attn/q_norm/ReduceMean_output_0 //blocks.12/self_attn/q_norm/Constant_1_output_0(/blocks.12/self_attn/q_norm/Add_output_0/blocks.12/self_attn/q_norm/Add"Add } (/blocks.12/self_attn/q_norm/Add_output_0)/blocks.12/self_attn/q_norm/Sqrt_output_0 /blocks.12/self_attn/q_norm/Sqrt"Sqrt //blocks.12/self_attn/q_norm/Constant_2_output_0&/blocks.12/self_attn/q_norm/Constant_2"Constant*H value*<B2/blocks.12/self_attn/q_norm/Constant_2_attr::valueJ?  //blocks.12/self_attn/q_norm/Constant_2_output_0 )/blocks.12/self_attn/q_norm/Sqrt_output_0(/blocks.12/self_attn/q_norm/Div_output_0/blocks.12/self_attn/q_norm/Div"Div  )/blocks.12/self_attn/q_norm/Cast_output_0+/blocks.12/self_attn/q_norm/Cast_1_output_0"/blocks.12/self_attn/q_norm/Cast_1"Cast* to  +/blocks.12/self_attn/q_norm/Cast_1_output_0 (/blocks.12/self_attn/q_norm/Div_output_0(/blocks.12/self_attn/q_norm/Mul_output_0/blocks.12/self_attn/q_norm/Mul"Mul  (/blocks.12/self_attn/q_norm/Mul_output_0 !blocks.12.self_attn.q_norm.weight*/blocks.12/self_attn/q_norm/Mul_1_output_0!/blocks.12/self_attn/q_norm/Mul_1"Mul  */blocks.12/self_attn/q_norm/Mul_1_output_0+/blocks.12/self_attn/q_norm/Cast_2_output_0"/blocks.12/self_attn/q_norm/Cast_2"Cast* to  '/blocks.12/self_attn/Reshape_1_output_0)/blocks.12/self_attn/k_norm/Cast_output_0 /blocks.12/self_attn/k_norm/Cast"Cast* to -/blocks.12/self_attn/k_norm/Constant_output_0$/blocks.12/self_attn/k_norm/Constant"Constant*F value*:B0/blocks.12/self_attn/k_norm/Constant_attr::valueJ@  )/blocks.12/self_attn/k_norm/Cast_output_0 -/blocks.12/self_attn/k_norm/Constant_output_0(/blocks.12/self_attn/k_norm/Pow_output_0/blocks.12/self_attn/k_norm/Pow"Pow  (/blocks.12/self_attn/k_norm/Pow_output_0//blocks.12/self_attn/k_norm/ReduceMean_output_0&/blocks.12/self_attn/k_norm/ReduceMean" ReduceMean* axes@* keepdims //blocks.12/self_attn/k_norm/Constant_1_output_0&/blocks.12/self_attn/k_norm/Constant_1"Constant*H value*<B2/blocks.12/self_attn/k_norm/Constant_1_attr::valueJ75  //blocks.12/self_attn/k_norm/ReduceMean_output_0 //blocks.12/self_attn/k_norm/Constant_1_output_0(/blocks.12/self_attn/k_norm/Add_output_0/blocks.12/self_attn/k_norm/Add"Add } (/blocks.12/self_attn/k_norm/Add_output_0)/blocks.12/self_attn/k_norm/Sqrt_output_0 /blocks.12/self_attn/k_norm/Sqrt"Sqrt //blocks.12/self_attn/k_norm/Constant_2_output_0&/blocks.12/self_attn/k_norm/Constant_2"Constant*H value*<B2/blocks.12/self_attn/k_norm/Constant_2_attr::valueJ?  //blocks.12/self_attn/k_norm/Constant_2_output_0 )/blocks.12/self_attn/k_norm/Sqrt_output_0(/blocks.12/self_attn/k_norm/Div_output_0/blocks.12/self_attn/k_norm/Div"Div  )/blocks.12/self_attn/k_norm/Cast_output_0+/blocks.12/self_attn/k_norm/Cast_1_output_0"/blocks.12/self_attn/k_norm/Cast_1"Cast* to  +/blocks.12/self_attn/k_norm/Cast_1_output_0 (/blocks.12/self_attn/k_norm/Div_output_0(/blocks.12/self_attn/k_norm/Mul_output_0/blocks.12/self_attn/k_norm/Mul"Mul  (/blocks.12/self_attn/k_norm/Mul_output_0 !blocks.12.self_attn.k_norm.weight*/blocks.12/self_attn/k_norm/Mul_1_output_0!/blocks.12/self_attn/k_norm/Mul_1"Mul  */blocks.12/self_attn/k_norm/Mul_1_output_0+/blocks.12/self_attn/k_norm/Cast_2_output_0"/blocks.12/self_attn/k_norm/Cast_2"Cast* to  +/blocks.12/self_attn/q_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0!/blocks.12/self_attn/Mul_output_0/blocks.12/self_attn/Mul"Mul y +/blocks.12/self_attn/q_norm/Cast_2_output_0%/blocks.12/self_attn/Shape_2_output_0/blocks.12/self_attn/Shape_2"Shape (/blocks.12/self_attn/Constant_8_output_0/blocks.12/self_attn/Constant_8"Constant*E value*9B+/blocks.12/self_attn/Constant_8_attr::valueJ  %/blocks.12/self_attn/Shape_2_output_0 (/blocks.12/self_attn/Constant_8_output_0&/blocks.12/self_attn/Gather_2_output_0/blocks.12/self_attn/Gather_2"Gather* axis (/blocks.12/self_attn/Constant_9_output_0/blocks.12/self_attn/Constant_9"Constant*E value*9B+/blocks.12/self_attn/Constant_9_attr::valueJ  &/blocks.12/self_attn/Gather_2_output_0 (/blocks.12/self_attn/Constant_9_output_0!/blocks.12/self_attn/Div_output_0/blocks.12/self_attn/Div"Div s !/blocks.12/self_attn/Div_output_0"/blocks.12/self_attn/Cast_output_0/blocks.12/self_attn/Cast"Cast* to x "/blocks.12/self_attn/Cast_output_0$/blocks.12/self_attn/Cast_1_output_0/blocks.12/self_attn/Cast_1"Cast* to )/blocks.12/self_attn/Constant_10_output_0 /blocks.12/self_attn/Constant_10"Constant*H value*<B,/blocks.12/self_attn/Constant_10_attr::valueJ )/blocks.12/self_attn/Constant_11_output_0 /blocks.12/self_attn/Constant_11"Constant*H value*<B,/blocks.12/self_attn/Constant_11_attr::valueJ )/blocks.12/self_attn/Constant_12_output_0 /blocks.12/self_attn/Constant_12"Constant*H value*<B,/blocks.12/self_attn/Constant_12_attr::valueJ  $/blocks.12/self_attn/Cast_1_output_0 )/blocks.12/self_attn/Constant_12_output_0)/blocks.12/self_attn/Unsqueeze_6_output_0 /blocks.12/self_attn/Unsqueeze_6" Unsqueeze )/blocks.12/self_attn/Constant_13_output_0 /blocks.12/self_attn/Constant_13"Constant*H value*<B,/blocks.12/self_attn/Constant_13_attr::valueJ  +/blocks.12/self_attn/q_norm/Cast_2_output_0 )/blocks.12/self_attn/Constant_11_output_0 )/blocks.12/self_attn/Unsqueeze_6_output_0 )/blocks.12/self_attn/Constant_10_output_0 )/blocks.12/self_attn/Constant_13_output_0#/blocks.12/self_attn/Slice_output_0/blocks.12/self_attn/Slice"Slice )/blocks.12/self_attn/Constant_14_output_0 /blocks.12/self_attn/Constant_14"Constant*H value*<B,/blocks.12/self_attn/Constant_14_attr::valueJ )/blocks.12/self_attn/Constant_15_output_0 /blocks.12/self_attn/Constant_15"Constant*H value*<B,/blocks.12/self_attn/Constant_15_attr::valueJ  $/blocks.12/self_attn/Cast_1_output_0 )/blocks.12/self_attn/Constant_15_output_0)/blocks.12/self_attn/Unsqueeze_7_output_0 /blocks.12/self_attn/Unsqueeze_7" Unsqueeze )/blocks.12/self_attn/Constant_16_output_0 /blocks.12/self_attn/Constant_16"Constant*H value*<B,/blocks.12/self_attn/Constant_16_attr::valueJ )/blocks.12/self_attn/Constant_17_output_0 /blocks.12/self_attn/Constant_17"Constant*H value*<B,/blocks.12/self_attn/Constant_17_attr::valueJ  +/blocks.12/self_attn/q_norm/Cast_2_output_0 )/blocks.12/self_attn/Unsqueeze_7_output_0 )/blocks.12/self_attn/Constant_16_output_0 )/blocks.12/self_attn/Constant_14_output_0 )/blocks.12/self_attn/Constant_17_output_0%/blocks.12/self_attn/Slice_1_output_0/blocks.12/self_attn/Slice_1"Slice i %/blocks.12/self_attn/Slice_1_output_0!/blocks.12/self_attn/Neg_output_0/blocks.12/self_attn/Neg"Neg  !/blocks.12/self_attn/Neg_output_0 #/blocks.12/self_attn/Slice_output_0&/blocks.12/self_attn/Concat_3_output_0/blocks.12/self_attn/Concat_3"Concat* axis  &/blocks.12/self_attn/Concat_3_output_0 %/blocks.0/self_attn/Gather_3_output_0#/blocks.12/self_attn/Mul_1_output_0/blocks.12/self_attn/Mul_1"Mul  !/blocks.12/self_attn/Mul_output_0 #/blocks.12/self_attn/Mul_1_output_0!/blocks.12/self_attn/Add_output_0/blocks.12/self_attn/Add"Add  +/blocks.12/self_attn/k_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0#/blocks.12/self_attn/Mul_2_output_0/blocks.12/self_attn/Mul_2"Mul y +/blocks.12/self_attn/k_norm/Cast_2_output_0%/blocks.12/self_attn/Shape_3_output_0/blocks.12/self_attn/Shape_3"Shape )/blocks.12/self_attn/Constant_18_output_0 /blocks.12/self_attn/Constant_18"Constant*F value*:B,/blocks.12/self_attn/Constant_18_attr::valueJ  %/blocks.12/self_attn/Shape_3_output_0 )/blocks.12/self_attn/Constant_18_output_0&/blocks.12/self_attn/Gather_3_output_0/blocks.12/self_attn/Gather_3"Gather* axis )/blocks.12/self_attn/Constant_19_output_0 /blocks.12/self_attn/Constant_19"Constant*F value*:B,/blocks.12/self_attn/Constant_19_attr::valueJ  &/blocks.12/self_attn/Gather_3_output_0 )/blocks.12/self_attn/Constant_19_output_0#/blocks.12/self_attn/Div_1_output_0/blocks.12/self_attn/Div_1"Div y #/blocks.12/self_attn/Div_1_output_0$/blocks.12/self_attn/Cast_2_output_0/blocks.12/self_attn/Cast_2"Cast* to z $/blocks.12/self_attn/Cast_2_output_0$/blocks.12/self_attn/Cast_3_output_0/blocks.12/self_attn/Cast_3"Cast* to )/blocks.12/self_attn/Constant_20_output_0 /blocks.12/self_attn/Constant_20"Constant*H value*<B,/blocks.12/self_attn/Constant_20_attr::valueJ )/blocks.12/self_attn/Constant_21_output_0 /blocks.12/self_attn/Constant_21"Constant*H value*<B,/blocks.12/self_attn/Constant_21_attr::valueJ )/blocks.12/self_attn/Constant_22_output_0 /blocks.12/self_attn/Constant_22"Constant*H value*<B,/blocks.12/self_attn/Constant_22_attr::valueJ  $/blocks.12/self_attn/Cast_3_output_0 )/blocks.12/self_attn/Constant_22_output_0)/blocks.12/self_attn/Unsqueeze_8_output_0 /blocks.12/self_attn/Unsqueeze_8" Unsqueeze )/blocks.12/self_attn/Constant_23_output_0 /blocks.12/self_attn/Constant_23"Constant*H value*<B,/blocks.12/self_attn/Constant_23_attr::valueJ  +/blocks.12/self_attn/k_norm/Cast_2_output_0 )/blocks.12/self_attn/Constant_21_output_0 )/blocks.12/self_attn/Unsqueeze_8_output_0 )/blocks.12/self_attn/Constant_20_output_0 )/blocks.12/self_attn/Constant_23_output_0%/blocks.12/self_attn/Slice_2_output_0/blocks.12/self_attn/Slice_2"Slice )/blocks.12/self_attn/Constant_24_output_0 /blocks.12/self_attn/Constant_24"Constant*H value*<B,/blocks.12/self_attn/Constant_24_attr::valueJ )/blocks.12/self_attn/Constant_25_output_0 /blocks.12/self_attn/Constant_25"Constant*H value*<B,/blocks.12/self_attn/Constant_25_attr::valueJ  $/blocks.12/self_attn/Cast_3_output_0 )/blocks.12/self_attn/Constant_25_output_0)/blocks.12/self_attn/Unsqueeze_9_output_0 /blocks.12/self_attn/Unsqueeze_9" Unsqueeze )/blocks.12/self_attn/Constant_26_output_0 /blocks.12/self_attn/Constant_26"Constant*H value*<B,/blocks.12/self_attn/Constant_26_attr::valueJ )/blocks.12/self_attn/Constant_27_output_0 /blocks.12/self_attn/Constant_27"Constant*H value*<B,/blocks.12/self_attn/Constant_27_attr::valueJ  +/blocks.12/self_attn/k_norm/Cast_2_output_0 )/blocks.12/self_attn/Unsqueeze_9_output_0 )/blocks.12/self_attn/Constant_26_output_0 )/blocks.12/self_attn/Constant_24_output_0 )/blocks.12/self_attn/Constant_27_output_0%/blocks.12/self_attn/Slice_3_output_0/blocks.12/self_attn/Slice_3"Slice m %/blocks.12/self_attn/Slice_3_output_0#/blocks.12/self_attn/Neg_1_output_0/blocks.12/self_attn/Neg_1"Neg  #/blocks.12/self_attn/Neg_1_output_0 %/blocks.12/self_attn/Slice_2_output_0&/blocks.12/self_attn/Concat_4_output_0/blocks.12/self_attn/Concat_4"Concat* axis  &/blocks.12/self_attn/Concat_4_output_0 %/blocks.0/self_attn/Gather_3_output_0#/blocks.12/self_attn/Mul_3_output_0/blocks.12/self_attn/Mul_3"Mul  #/blocks.12/self_attn/Mul_2_output_0 #/blocks.12/self_attn/Mul_3_output_0#/blocks.12/self_attn/Add_1_output_0/blocks.12/self_attn/Add_1"Add  /Gather_12_output_0 /rotary/Constant_3_output_0&/blocks.12/self_attn/Gather_4_output_0/blocks.12/self_attn/Gather_4"Gather* axis  /Gather_12_output_0 /rotary/Constant_8_output_0&/blocks.12/self_attn/Gather_5_output_0/blocks.12/self_attn/Gather_5"Gather* axis  &/blocks.12/self_attn/Gather_4_output_0 #/blocks.12/self_attn/Add_1_output_0&/blocks.12/self_attn/Concat_5_output_0/blocks.12/self_attn/Concat_5"Concat* axis  &/blocks.12/self_attn/Gather_5_output_0 '/blocks.12/self_attn/Reshape_2_output_0&/blocks.12/self_attn/Concat_6_output_0/blocks.12/self_attn/Concat_6"Concat* axis )/blocks.12/self_attn/Constant_28_output_0 /blocks.12/self_attn/Constant_28"Constant*H value*<B,/blocks.12/self_attn/Constant_28_attr::valueJ  &/blocks.12/self_attn/Concat_5_output_0 )/blocks.12/self_attn/Constant_28_output_0*/blocks.12/self_attn/Unsqueeze_10_output_0!/blocks.12/self_attn/Unsqueeze_10" Unsqueeze )/blocks.12/self_attn/Constant_29_output_0 /blocks.12/self_attn/Constant_29"Constant*H value*<B,/blocks.12/self_attn/Constant_29_attr::valueJ  &/blocks.12/self_attn/Concat_6_output_0 )/blocks.12/self_attn/Constant_29_output_0*/blocks.12/self_attn/Unsqueeze_11_output_0!/blocks.12/self_attn/Unsqueeze_11" Unsqueeze  */blocks.12/self_attn/Unsqueeze_10_output_0 */blocks.12/self_attn/Unsqueeze_11_output_0&/blocks.12/self_attn/Concat_7_output_0/blocks.12/self_attn/Concat_7"Concat* axis  !/blocks.12/self_attn/Add_output_0'/blocks.12/self_attn/Transpose_output_0/blocks.12/self_attn/Transpose" Transpose* perm@@@@  &/blocks.12/self_attn/Concat_5_output_0)/blocks.12/self_attn/Transpose_1_output_0 /blocks.12/self_attn/Transpose_1" Transpose* perm@@@@  &/blocks.12/self_attn/Concat_6_output_0)/blocks.12/self_attn/Transpose_2_output_0 /blocks.12/self_attn/Transpose_2" Transpose* perm@@@@ w )/blocks.12/self_attn/Transpose_1_output_0%/blocks.12/self_attn/Shape_4_output_0/blocks.12/self_attn/Shape_4"Shape )/blocks.12/self_attn/Constant_30_output_0 /blocks.12/self_attn/Constant_30"Constant*F value*:B,/blocks.12/self_attn/Constant_30_attr::valueJ  %/blocks.12/self_attn/Shape_4_output_0 )/blocks.12/self_attn/Constant_30_output_0&/blocks.12/self_attn/Gather_6_output_0/blocks.12/self_attn/Gather_6"Gather* axis w )/blocks.12/self_attn/Transpose_1_output_0%/blocks.12/self_attn/Shape_5_output_0/blocks.12/self_attn/Shape_5"Shape )/blocks.12/self_attn/Constant_31_output_0 /blocks.12/self_attn/Constant_31"Constant*F value*:B,/blocks.12/self_attn/Constant_31_attr::valueJ  %/blocks.12/self_attn/Shape_5_output_0 )/blocks.12/self_attn/Constant_31_output_0&/blocks.12/self_attn/Gather_7_output_0/blocks.12/self_attn/Gather_7"Gather* axis w )/blocks.12/self_attn/Transpose_1_output_0%/blocks.12/self_attn/Shape_6_output_0/blocks.12/self_attn/Shape_6"Shape )/blocks.12/self_attn/Constant_32_output_0 /blocks.12/self_attn/Constant_32"Constant*F value*:B,/blocks.12/self_attn/Constant_32_attr::valueJ  %/blocks.12/self_attn/Shape_6_output_0 )/blocks.12/self_attn/Constant_32_output_0&/blocks.12/self_attn/Gather_8_output_0/blocks.12/self_attn/Gather_8"Gather* axis w )/blocks.12/self_attn/Transpose_1_output_0%/blocks.12/self_attn/Shape_7_output_0/blocks.12/self_attn/Shape_7"Shape )/blocks.12/self_attn/Constant_33_output_0 /blocks.12/self_attn/Constant_33"Constant*F value*:B,/blocks.12/self_attn/Constant_33_attr::valueJ  %/blocks.12/self_attn/Shape_7_output_0 )/blocks.12/self_attn/Constant_33_output_0&/blocks.12/self_attn/Gather_9_output_0/blocks.12/self_attn/Gather_9"Gather* axis )/blocks.12/self_attn/Constant_34_output_0 /blocks.12/self_attn/Constant_34"Constant*H value*<B,/blocks.12/self_attn/Constant_34_attr::valueJ  )/blocks.12/self_attn/Transpose_1_output_0 )/blocks.12/self_attn/Constant_34_output_0*/blocks.12/self_attn/Unsqueeze_12_output_0!/blocks.12/self_attn/Unsqueeze_12" Unsqueeze )/blocks.12/self_attn/Constant_35_output_0 /blocks.12/self_attn/Constant_35"Constant*H value*<B,/blocks.12/self_attn/Constant_35_attr::valueJ  &/blocks.12/self_attn/Gather_6_output_0 )/blocks.12/self_attn/Constant_35_output_0*/blocks.12/self_attn/Unsqueeze_13_output_0!/blocks.12/self_attn/Unsqueeze_13" Unsqueeze )/blocks.12/self_attn/Constant_36_output_0 /blocks.12/self_attn/Constant_36"Constant*H value*<B,/blocks.12/self_attn/Constant_36_attr::valueJ  &/blocks.12/self_attn/Gather_7_output_0 )/blocks.12/self_attn/Constant_36_output_0*/blocks.12/self_attn/Unsqueeze_14_output_0!/blocks.12/self_attn/Unsqueeze_14" Unsqueeze )/blocks.12/self_attn/Constant_37_output_0 /blocks.12/self_attn/Constant_37"Constant*H value*<B,/blocks.12/self_attn/Constant_37_attr::valueJ )/blocks.12/self_attn/Constant_38_output_0 /blocks.12/self_attn/Constant_38"Constant*H value*<B,/blocks.12/self_attn/Constant_38_attr::valueJ  &/blocks.12/self_attn/Gather_8_output_0 )/blocks.12/self_attn/Constant_38_output_0*/blocks.12/self_attn/Unsqueeze_15_output_0!/blocks.12/self_attn/Unsqueeze_15" Unsqueeze )/blocks.12/self_attn/Constant_39_output_0 /blocks.12/self_attn/Constant_39"Constant*H value*<B,/blocks.12/self_attn/Constant_39_attr::valueJ  &/blocks.12/self_attn/Gather_9_output_0 )/blocks.12/self_attn/Constant_39_output_0*/blocks.12/self_attn/Unsqueeze_16_output_0!/blocks.12/self_attn/Unsqueeze_16" Unsqueeze  */blocks.12/self_attn/Unsqueeze_13_output_0 */blocks.12/self_attn/Unsqueeze_14_output_0 )/blocks.12/self_attn/Constant_37_output_0 */blocks.12/self_attn/Unsqueeze_15_output_0 */blocks.12/self_attn/Unsqueeze_16_output_0&/blocks.12/self_attn/Concat_8_output_0/blocks.12/self_attn/Concat_8"Concat* axis )/blocks.12/self_attn/Constant_40_output_0 /blocks.12/self_attn/Constant_40"Constant*H value*<B,/blocks.12/self_attn/Constant_40_attr::valueJ  &/blocks.12/self_attn/Concat_8_output_0 )/blocks.12/self_attn/Constant_40_output_0'/blocks.12/self_attn/Reshape_3_output_0/blocks.12/self_attn/Reshape_3"Reshape* allowzero u '/blocks.12/self_attn/Reshape_3_output_0%/blocks.12/self_attn/Shape_8_output_0/blocks.12/self_attn/Shape_8"Shape  %/blocks.12/self_attn/Shape_8_output_0-/blocks.12/self_attn/ConstantOfShape_output_0$/blocks.12/self_attn/ConstantOfShape"ConstantOfShape*L value*@B0/blocks.12/self_attn/ConstantOfShape_attr::valueJ )/blocks.12/self_attn/Constant_41_output_0 /blocks.12/self_attn/Constant_41"Constant*F value*:B,/blocks.12/self_attn/Constant_41_attr::valueJ  -/blocks.12/self_attn/ConstantOfShape_output_0 )/blocks.12/self_attn/Constant_41_output_0#/blocks.12/self_attn/Mul_4_output_0/blocks.12/self_attn/Mul_4"Mul  '/blocks.12/self_attn/Reshape_3_output_0 #/blocks.12/self_attn/Mul_4_output_0#/blocks.12/self_attn/Equal_output_0/blocks.12/self_attn/Equal"Equal  #/blocks.12/self_attn/Equal_output_0 -/blocks.12/self_attn/ConstantOfShape_output_0 '/blocks.12/self_attn/Reshape_3_output_0#/blocks.12/self_attn/Where_output_0/blocks.12/self_attn/Where"Where  */blocks.12/self_attn/Unsqueeze_12_output_0 #/blocks.12/self_attn/Where_output_0$/blocks.12/self_attn/Expand_output_0/blocks.12/self_attn/Expand"Expand )/blocks.12/self_attn/Constant_42_output_0 /blocks.12/self_attn/Constant_42"Constant*F value*:B,/blocks.12/self_attn/Constant_42_attr::valueJ  &/blocks.12/self_attn/Gather_7_output_0 )/blocks.12/self_attn/Constant_42_output_0#/blocks.12/self_attn/Mul_5_output_0/blocks.12/self_attn/Mul_5"Mul fonnx::Unsqueeze_4024 Constant_5851"Constant*5 value*)BConstant_5851_attr::valueJ  &/blocks.12/self_attn/Gather_6_output_0 onnx::Unsqueeze_4024*/blocks.12/self_attn/Unsqueeze_17_output_0!/blocks.12/self_attn/Unsqueeze_17" Unsqueeze fonnx::Unsqueeze_4026 Constant_5853"Constant*5 value*)BConstant_5853_attr::valueJ  #/blocks.12/self_attn/Mul_5_output_0 onnx::Unsqueeze_4026*/blocks.12/self_attn/Unsqueeze_18_output_0!/blocks.12/self_attn/Unsqueeze_18" Unsqueeze fonnx::Unsqueeze_4028 Constant_5855"Constant*5 value*)BConstant_5855_attr::valueJ  &/blocks.12/self_attn/Gather_8_output_0 onnx::Unsqueeze_4028*/blocks.12/self_attn/Unsqueeze_19_output_0!/blocks.12/self_attn/Unsqueeze_19" Unsqueeze fonnx::Unsqueeze_4030 Constant_5857"Constant*5 value*)BConstant_5857_attr::valueJ  &/blocks.12/self_attn/Gather_9_output_0 onnx::Unsqueeze_4030*/blocks.12/self_attn/Unsqueeze_20_output_0!/blocks.12/self_attn/Unsqueeze_20" Unsqueeze  */blocks.12/self_attn/Unsqueeze_17_output_0 */blocks.12/self_attn/Unsqueeze_18_output_0 */blocks.12/self_attn/Unsqueeze_19_output_0 */blocks.12/self_attn/Unsqueeze_20_output_0&/blocks.12/self_attn/Concat_9_output_0/blocks.12/self_attn/Concat_9"Concat* axis  $/blocks.12/self_attn/Expand_output_0 &/blocks.12/self_attn/Concat_9_output_0'/blocks.12/self_attn/Reshape_4_output_0/blocks.12/self_attn/Reshape_4"Reshape* allowzero w )/blocks.12/self_attn/Transpose_2_output_0%/blocks.12/self_attn/Shape_9_output_0/blocks.12/self_attn/Shape_9"Shape )/blocks.12/self_attn/Constant_43_output_0 /blocks.12/self_attn/Constant_43"Constant*F value*:B,/blocks.12/self_attn/Constant_43_attr::valueJ  %/blocks.12/self_attn/Shape_9_output_0 )/blocks.12/self_attn/Constant_43_output_0'/blocks.12/self_attn/Gather_10_output_0/blocks.12/self_attn/Gather_10"Gather* axis y )/blocks.12/self_attn/Transpose_2_output_0&/blocks.12/self_attn/Shape_10_output_0/blocks.12/self_attn/Shape_10"Shape )/blocks.12/self_attn/Constant_44_output_0 /blocks.12/self_attn/Constant_44"Constant*F value*:B,/blocks.12/self_attn/Constant_44_attr::valueJ  &/blocks.12/self_attn/Shape_10_output_0 )/blocks.12/self_attn/Constant_44_output_0'/blocks.12/self_attn/Gather_11_output_0/blocks.12/self_attn/Gather_11"Gather* axis y )/blocks.12/self_attn/Transpose_2_output_0&/blocks.12/self_attn/Shape_11_output_0/blocks.12/self_attn/Shape_11"Shape )/blocks.12/self_attn/Constant_45_output_0 /blocks.12/self_attn/Constant_45"Constant*F value*:B,/blocks.12/self_attn/Constant_45_attr::valueJ  &/blocks.12/self_attn/Shape_11_output_0 )/blocks.12/self_attn/Constant_45_output_0'/blocks.12/self_attn/Gather_12_output_0/blocks.12/self_attn/Gather_12"Gather* axis y )/blocks.12/self_attn/Transpose_2_output_0&/blocks.12/self_attn/Shape_12_output_0/blocks.12/self_attn/Shape_12"Shape )/blocks.12/self_attn/Constant_46_output_0 /blocks.12/self_attn/Constant_46"Constant*F value*:B,/blocks.12/self_attn/Constant_46_attr::valueJ  &/blocks.12/self_attn/Shape_12_output_0 )/blocks.12/self_attn/Constant_46_output_0'/blocks.12/self_attn/Gather_13_output_0/blocks.12/self_attn/Gather_13"Gather* axis )/blocks.12/self_attn/Constant_47_output_0 /blocks.12/self_attn/Constant_47"Constant*H value*<B,/blocks.12/self_attn/Constant_47_attr::valueJ  )/blocks.12/self_attn/Transpose_2_output_0 )/blocks.12/self_attn/Constant_47_output_0*/blocks.12/self_attn/Unsqueeze_21_output_0!/blocks.12/self_attn/Unsqueeze_21" Unsqueeze )/blocks.12/self_attn/Constant_48_output_0 /blocks.12/self_attn/Constant_48"Constant*H value*<B,/blocks.12/self_attn/Constant_48_attr::valueJ  '/blocks.12/self_attn/Gather_10_output_0 )/blocks.12/self_attn/Constant_48_output_0*/blocks.12/self_attn/Unsqueeze_22_output_0!/blocks.12/self_attn/Unsqueeze_22" Unsqueeze )/blocks.12/self_attn/Constant_49_output_0 /blocks.12/self_attn/Constant_49"Constant*H value*<B,/blocks.12/self_attn/Constant_49_attr::valueJ  '/blocks.12/self_attn/Gather_11_output_0 )/blocks.12/self_attn/Constant_49_output_0*/blocks.12/self_attn/Unsqueeze_23_output_0!/blocks.12/self_attn/Unsqueeze_23" Unsqueeze )/blocks.12/self_attn/Constant_50_output_0 /blocks.12/self_attn/Constant_50"Constant*H value*<B,/blocks.12/self_attn/Constant_50_attr::valueJ )/blocks.12/self_attn/Constant_51_output_0 /blocks.12/self_attn/Constant_51"Constant*H value*<B,/blocks.12/self_attn/Constant_51_attr::valueJ  '/blocks.12/self_attn/Gather_12_output_0 )/blocks.12/self_attn/Constant_51_output_0*/blocks.12/self_attn/Unsqueeze_24_output_0!/blocks.12/self_attn/Unsqueeze_24" Unsqueeze )/blocks.12/self_attn/Constant_52_output_0 /blocks.12/self_attn/Constant_52"Constant*H value*<B,/blocks.12/self_attn/Constant_52_attr::valueJ  '/blocks.12/self_attn/Gather_13_output_0 )/blocks.12/self_attn/Constant_52_output_0*/blocks.12/self_attn/Unsqueeze_25_output_0!/blocks.12/self_attn/Unsqueeze_25" Unsqueeze  */blocks.12/self_attn/Unsqueeze_22_output_0 */blocks.12/self_attn/Unsqueeze_23_output_0 )/blocks.12/self_attn/Constant_50_output_0 */blocks.12/self_attn/Unsqueeze_24_output_0 */blocks.12/self_attn/Unsqueeze_25_output_0'/blocks.12/self_attn/Concat_10_output_0/blocks.12/self_attn/Concat_10"Concat* axis )/blocks.12/self_attn/Constant_53_output_0 /blocks.12/self_attn/Constant_53"Constant*H value*<B,/blocks.12/self_attn/Constant_53_attr::valueJ  '/blocks.12/self_attn/Concat_10_output_0 )/blocks.12/self_attn/Constant_53_output_0'/blocks.12/self_attn/Reshape_5_output_0/blocks.12/self_attn/Reshape_5"Reshape* allowzero w '/blocks.12/self_attn/Reshape_5_output_0&/blocks.12/self_attn/Shape_13_output_0/blocks.12/self_attn/Shape_13"Shape  &/blocks.12/self_attn/Shape_13_output_0//blocks.12/self_attn/ConstantOfShape_1_output_0&/blocks.12/self_attn/ConstantOfShape_1"ConstantOfShape*N value*BB2/blocks.12/self_attn/ConstantOfShape_1_attr::valueJ )/blocks.12/self_attn/Constant_54_output_0 /blocks.12/self_attn/Constant_54"Constant*F value*:B,/blocks.12/self_attn/Constant_54_attr::valueJ  //blocks.12/self_attn/ConstantOfShape_1_output_0 )/blocks.12/self_attn/Constant_54_output_0#/blocks.12/self_attn/Mul_6_output_0/blocks.12/self_attn/Mul_6"Mul  '/blocks.12/self_attn/Reshape_5_output_0 #/blocks.12/self_attn/Mul_6_output_0%/blocks.12/self_attn/Equal_1_output_0/blocks.12/self_attn/Equal_1"Equal  %/blocks.12/self_attn/Equal_1_output_0 //blocks.12/self_attn/ConstantOfShape_1_output_0 '/blocks.12/self_attn/Reshape_5_output_0%/blocks.12/self_attn/Where_1_output_0/blocks.12/self_attn/Where_1"Where  */blocks.12/self_attn/Unsqueeze_21_output_0 %/blocks.12/self_attn/Where_1_output_0&/blocks.12/self_attn/Expand_1_output_0/blocks.12/self_attn/Expand_1"Expand )/blocks.12/self_attn/Constant_55_output_0 /blocks.12/self_attn/Constant_55"Constant*F value*:B,/blocks.12/self_attn/Constant_55_attr::valueJ  '/blocks.12/self_attn/Gather_11_output_0 )/blocks.12/self_attn/Constant_55_output_0#/blocks.12/self_attn/Mul_7_output_0/blocks.12/self_attn/Mul_7"Mul fonnx::Unsqueeze_4070 Constant_5896"Constant*5 value*)BConstant_5896_attr::valueJ  '/blocks.12/self_attn/Gather_10_output_0 onnx::Unsqueeze_4070*/blocks.12/self_attn/Unsqueeze_26_output_0!/blocks.12/self_attn/Unsqueeze_26" Unsqueeze fonnx::Unsqueeze_4072 Constant_5898"Constant*5 value*)BConstant_5898_attr::valueJ  #/blocks.12/self_attn/Mul_7_output_0 onnx::Unsqueeze_4072*/blocks.12/self_attn/Unsqueeze_27_output_0!/blocks.12/self_attn/Unsqueeze_27" Unsqueeze fonnx::Unsqueeze_4074 Constant_5900"Constant*5 value*)BConstant_5900_attr::valueJ  '/blocks.12/self_attn/Gather_12_output_0 onnx::Unsqueeze_4074*/blocks.12/self_attn/Unsqueeze_28_output_0!/blocks.12/self_attn/Unsqueeze_28" Unsqueeze fonnx::Unsqueeze_4076 Constant_5902"Constant*5 value*)BConstant_5902_attr::valueJ  '/blocks.12/self_attn/Gather_13_output_0 onnx::Unsqueeze_4076*/blocks.12/self_attn/Unsqueeze_29_output_0!/blocks.12/self_attn/Unsqueeze_29" Unsqueeze  */blocks.12/self_attn/Unsqueeze_26_output_0 */blocks.12/self_attn/Unsqueeze_27_output_0 */blocks.12/self_attn/Unsqueeze_28_output_0 */blocks.12/self_attn/Unsqueeze_29_output_0'/blocks.12/self_attn/Concat_11_output_0/blocks.12/self_attn/Concat_11"Concat* axis  &/blocks.12/self_attn/Expand_1_output_0 '/blocks.12/self_attn/Concat_11_output_0'/blocks.12/self_attn/Reshape_6_output_0/blocks.12/self_attn/Reshape_6"Reshape* allowzero  '/blocks.12/self_attn/Transpose_output_0 '/blocks.12/self_attn/Reshape_4_output_0$/blocks.12/self_attn/MatMul_output_0/blocks.12/self_attn/MatMul"MatMul )/blocks.12/self_attn/Constant_56_output_0 /blocks.12/self_attn/Constant_56"Constant*B value*6B,/blocks.12/self_attn/Constant_56_attr::valueJ5A  $/blocks.12/self_attn/MatMul_output_0 )/blocks.12/self_attn/Constant_56_output_0#/blocks.12/self_attn/Div_2_output_0/blocks.12/self_attn/Div_2"Div { #/blocks.12/self_attn/Div_2_output_0 attention_mask#/blocks.12/self_attn/Add_2_output_0/blocks.12/self_attn/Add_2"Add  #/blocks.12/self_attn/Add_2_output_0%/blocks.12/self_attn/Softmax_output_0/blocks.12/self_attn/Softmax"Softmax* axis { %/blocks.12/self_attn/Softmax_output_0$/blocks.12/self_attn/Cast_4_output_0/blocks.12/self_attn/Cast_4"Cast* to  $/blocks.12/self_attn/Cast_4_output_0 '/blocks.12/self_attn/Reshape_6_output_0&/blocks.12/self_attn/MatMul_1_output_0/blocks.12/self_attn/MatMul_1"MatMul  &/blocks.12/self_attn/MatMul_1_output_0)/blocks.12/self_attn/Transpose_3_output_0 /blocks.12/self_attn/Transpose_3" Transpose* perm@@@@ fonnx::Unsqueeze_4088 Constant_5914"Constant*5 value*)BConstant_5914_attr::valueJ  $/blocks.12/self_attn/Gather_output_0 onnx::Unsqueeze_4088*/blocks.12/self_attn/Unsqueeze_30_output_0!/blocks.12/self_attn/Unsqueeze_30" Unsqueeze fonnx::Unsqueeze_4090 Constant_5916"Constant*5 value*)BConstant_5916_attr::valueJ  &/blocks.12/self_attn/Gather_1_output_0 onnx::Unsqueeze_4090*/blocks.12/self_attn/Unsqueeze_31_output_0!/blocks.12/self_attn/Unsqueeze_31" Unsqueeze )/blocks.12/self_attn/Constant_57_output_0 /blocks.12/self_attn/Constant_57"Constant*H value*<B,/blocks.12/self_attn/Constant_57_attr::valueJ  */blocks.12/self_attn/Unsqueeze_30_output_0 */blocks.12/self_attn/Unsqueeze_31_output_0 )/blocks.12/self_attn/Constant_57_output_0'/blocks.12/self_attn/Concat_12_output_0/blocks.12/self_attn/Concat_12"Concat* axis  )/blocks.12/self_attn/Transpose_3_output_0 '/blocks.12/self_attn/Concat_12_output_0'/blocks.12/self_attn/Reshape_7_output_0/blocks.12/self_attn/Reshape_7"Reshape* allowzero  '/blocks.12/self_attn/Reshape_7_output_0 onnx::MatMul_8925+/blocks.12/self_attn/o_proj/MatMul_output_0"/blocks.12/self_attn/o_proj/MatMul"MatMul  */blocks.12/input_layernorm/Cast_1_output_0 +/blocks.12/self_attn/o_proj/MatMul_output_0/blocks.12/Add_output_0/blocks.12/Add"Add  /blocks.12/Add_output_01/blocks.12/post_attention_layernorm/Cast_output_0(/blocks.12/post_attention_layernorm/Cast"Cast* to 5/blocks.12/post_attention_layernorm/Constant_output_0,/blocks.12/post_attention_layernorm/Constant"Constant*N value*BB8/blocks.12/post_attention_layernorm/Constant_attr::valueJ@  1/blocks.12/post_attention_layernorm/Cast_output_0 5/blocks.12/post_attention_layernorm/Constant_output_00/blocks.12/post_attention_layernorm/Pow_output_0'/blocks.12/post_attention_layernorm/Pow"Pow  0/blocks.12/post_attention_layernorm/Pow_output_07/blocks.12/post_attention_layernorm/ReduceMean_output_0./blocks.12/post_attention_layernorm/ReduceMean" ReduceMean* axes@* keepdims 7/blocks.12/post_attention_layernorm/Constant_1_output_0./blocks.12/post_attention_layernorm/Constant_1"Constant*P value*DB:/blocks.12/post_attention_layernorm/Constant_1_attr::valueJ75  7/blocks.12/post_attention_layernorm/ReduceMean_output_0 7/blocks.12/post_attention_layernorm/Constant_1_output_00/blocks.12/post_attention_layernorm/Add_output_0'/blocks.12/post_attention_layernorm/Add"Add  0/blocks.12/post_attention_layernorm/Add_output_01/blocks.12/post_attention_layernorm/Sqrt_output_0(/blocks.12/post_attention_layernorm/Sqrt"Sqrt 7/blocks.12/post_attention_layernorm/Constant_2_output_0./blocks.12/post_attention_layernorm/Constant_2"Constant*P value*DB:/blocks.12/post_attention_layernorm/Constant_2_attr::valueJ?  7/blocks.12/post_attention_layernorm/Constant_2_output_0 1/blocks.12/post_attention_layernorm/Sqrt_output_00/blocks.12/post_attention_layernorm/Div_output_0'/blocks.12/post_attention_layernorm/Div"Div  1/blocks.12/post_attention_layernorm/Cast_output_03/blocks.12/post_attention_layernorm/Cast_1_output_0*/blocks.12/post_attention_layernorm/Cast_1"Cast* to  3/blocks.12/post_attention_layernorm/Cast_1_output_0 0/blocks.12/post_attention_layernorm/Div_output_00/blocks.12/post_attention_layernorm/Mul_output_0'/blocks.12/post_attention_layernorm/Mul"Mul  0/blocks.12/post_attention_layernorm/Mul_output_0 )blocks.12.post_attention_layernorm.weight2/blocks.12/post_attention_layernorm/Mul_1_output_0)/blocks.12/post_attention_layernorm/Mul_1"Mul  2/blocks.12/post_attention_layernorm/Mul_1_output_03/blocks.12/post_attention_layernorm/Cast_2_output_0*/blocks.12/post_attention_layernorm/Cast_2"Cast* to  3/blocks.12/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_8926(/blocks.12/mlp/gate_proj/MatMul_output_0/blocks.12/mlp/gate_proj/MatMul"MatMul z (/blocks.12/mlp/gate_proj/MatMul_output_0&/blocks.12/mlp/act_fn/Sigmoid_output_0/blocks.12/mlp/act_fn/Sigmoid"Sigmoid  (/blocks.12/mlp/gate_proj/MatMul_output_0 &/blocks.12/mlp/act_fn/Sigmoid_output_0"/blocks.12/mlp/act_fn/Mul_output_0/blocks.12/mlp/act_fn/Mul"Mul  3/blocks.12/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_8927&/blocks.12/mlp/up_proj/MatMul_output_0/blocks.12/mlp/up_proj/MatMul"MatMul  "/blocks.12/mlp/act_fn/Mul_output_0 &/blocks.12/mlp/up_proj/MatMul_output_0/blocks.12/mlp/Mul_output_0/blocks.12/mlp/Mul"Mul  /blocks.12/mlp/Mul_output_0 onnx::MatMul_8928(/blocks.12/mlp/down_proj/MatMul_output_0/blocks.12/mlp/down_proj/MatMul"MatMul  3/blocks.12/post_attention_layernorm/Cast_1_output_0 (/blocks.12/mlp/down_proj/MatMul_output_0/blocks.12/Add_1_output_0/blocks.12/Add_1"Add `/Constant_6_output_0 /Constant_6"Constant*1 value*%B/Constant_6_attr::valueJ  ] past_key_values /Constant_6_output_0/Gather_13_output_0 /Gather_13"Gather* axis /blocks.13/Constant_output_0/blocks.13/Constant"Constant*K value*?B/blocks.13/Constant_attr::valueJ  /blocks.12/Add_1_output_0 /blocks.13/Constant_output_0/blocks.13/Reshape_output_0/blocks.13/Reshape"Reshape* allowzero y /blocks.13/Reshape_output_0(/blocks.13/input_layernorm/Cast_output_0/blocks.13/input_layernorm/Cast"Cast* to ,/blocks.13/input_layernorm/Constant_output_0#/blocks.13/input_layernorm/Constant"Constant*E value*9B//blocks.13/input_layernorm/Constant_attr::valueJ@  (/blocks.13/input_layernorm/Cast_output_0 ,/blocks.13/input_layernorm/Constant_output_0'/blocks.13/input_layernorm/Pow_output_0/blocks.13/input_layernorm/Pow"Pow  '/blocks.13/input_layernorm/Pow_output_0./blocks.13/input_layernorm/ReduceMean_output_0%/blocks.13/input_layernorm/ReduceMean" ReduceMean* axes@* keepdims ./blocks.13/input_layernorm/Constant_1_output_0%/blocks.13/input_layernorm/Constant_1"Constant*G value*;B1/blocks.13/input_layernorm/Constant_1_attr::valueJ75  ./blocks.13/input_layernorm/ReduceMean_output_0 ./blocks.13/input_layernorm/Constant_1_output_0'/blocks.13/input_layernorm/Add_output_0/blocks.13/input_layernorm/Add"Add z '/blocks.13/input_layernorm/Add_output_0(/blocks.13/input_layernorm/Sqrt_output_0/blocks.13/input_layernorm/Sqrt"Sqrt ./blocks.13/input_layernorm/Constant_2_output_0%/blocks.13/input_layernorm/Constant_2"Constant*G value*;B1/blocks.13/input_layernorm/Constant_2_attr::valueJ?  ./blocks.13/input_layernorm/Constant_2_output_0 (/blocks.13/input_layernorm/Sqrt_output_0'/blocks.13/input_layernorm/Div_output_0/blocks.13/input_layernorm/Div"Div  (/blocks.13/input_layernorm/Cast_output_0*/blocks.13/input_layernorm/Cast_1_output_0!/blocks.13/input_layernorm/Cast_1"Cast* to  */blocks.13/input_layernorm/Cast_1_output_0 '/blocks.13/input_layernorm/Div_output_0'/blocks.13/input_layernorm/Mul_output_0/blocks.13/input_layernorm/Mul"Mul  '/blocks.13/input_layernorm/Mul_output_0 blocks.13.input_layernorm.weight)/blocks.13/input_layernorm/Mul_1_output_0 /blocks.13/input_layernorm/Mul_1"Mul  )/blocks.13/input_layernorm/Mul_1_output_0*/blocks.13/input_layernorm/Cast_2_output_0!/blocks.13/input_layernorm/Cast_2"Cast* to t */blocks.13/input_layernorm/Cast_2_output_0#/blocks.13/self_attn/Shape_output_0/blocks.13/self_attn/Shape"Shape &/blocks.13/self_attn/Constant_output_0/blocks.13/self_attn/Constant"Constant*C value*7B)/blocks.13/self_attn/Constant_attr::valueJ  #/blocks.13/self_attn/Shape_output_0 &/blocks.13/self_attn/Constant_output_0$/blocks.13/self_attn/Gather_output_0/blocks.13/self_attn/Gather"Gather* axis x */blocks.13/input_layernorm/Cast_2_output_0%/blocks.13/self_attn/Shape_1_output_0/blocks.13/self_attn/Shape_1"Shape (/blocks.13/self_attn/Constant_1_output_0/blocks.13/self_attn/Constant_1"Constant*E value*9B+/blocks.13/self_attn/Constant_1_attr::valueJ  %/blocks.13/self_attn/Shape_1_output_0 (/blocks.13/self_attn/Constant_1_output_0&/blocks.13/self_attn/Gather_1_output_0/blocks.13/self_attn/Gather_1"Gather* axis  */blocks.13/input_layernorm/Cast_2_output_0 onnx::MatMul_8929+/blocks.13/self_attn/q_proj/MatMul_output_0"/blocks.13/self_attn/q_proj/MatMul"MatMul  */blocks.13/input_layernorm/Cast_2_output_0 onnx::MatMul_8930+/blocks.13/self_attn/k_proj/MatMul_output_0"/blocks.13/self_attn/k_proj/MatMul"MatMul  */blocks.13/input_layernorm/Cast_2_output_0 onnx::MatMul_8931+/blocks.13/self_attn/v_proj/MatMul_output_0"/blocks.13/self_attn/v_proj/MatMul"MatMul fonnx::Unsqueeze_4151 Constant_5969"Constant*5 value*)BConstant_5969_attr::valueJ  $/blocks.13/self_attn/Gather_output_0 onnx::Unsqueeze_4151'/blocks.13/self_attn/Unsqueeze_output_0/blocks.13/self_attn/Unsqueeze" Unsqueeze fonnx::Unsqueeze_4153 Constant_5971"Constant*5 value*)BConstant_5971_attr::valueJ  &/blocks.13/self_attn/Gather_1_output_0 onnx::Unsqueeze_4153)/blocks.13/self_attn/Unsqueeze_1_output_0 /blocks.13/self_attn/Unsqueeze_1" Unsqueeze (/blocks.13/self_attn/Constant_2_output_0/blocks.13/self_attn/Constant_2"Constant*G value*;B+/blocks.13/self_attn/Constant_2_attr::valueJ (/blocks.13/self_attn/Constant_3_output_0/blocks.13/self_attn/Constant_3"Constant*G value*;B+/blocks.13/self_attn/Constant_3_attr::valueJ  '/blocks.13/self_attn/Unsqueeze_output_0 )/blocks.13/self_attn/Unsqueeze_1_output_0 (/blocks.13/self_attn/Constant_2_output_0 (/blocks.13/self_attn/Constant_3_output_0$/blocks.13/self_attn/Concat_output_0/blocks.13/self_attn/Concat"Concat* axis  +/blocks.13/self_attn/q_proj/MatMul_output_0 $/blocks.13/self_attn/Concat_output_0%/blocks.13/self_attn/Reshape_output_0/blocks.13/self_attn/Reshape"Reshape* allowzero fonnx::Unsqueeze_4161 Constant_5977"Constant*5 value*)BConstant_5977_attr::valueJ  $/blocks.13/self_attn/Gather_output_0 onnx::Unsqueeze_4161)/blocks.13/self_attn/Unsqueeze_2_output_0 /blocks.13/self_attn/Unsqueeze_2" Unsqueeze fonnx::Unsqueeze_4163 Constant_5979"Constant*5 value*)BConstant_5979_attr::valueJ  &/blocks.13/self_attn/Gather_1_output_0 onnx::Unsqueeze_4163)/blocks.13/self_attn/Unsqueeze_3_output_0 /blocks.13/self_attn/Unsqueeze_3" Unsqueeze (/blocks.13/self_attn/Constant_4_output_0/blocks.13/self_attn/Constant_4"Constant*G value*;B+/blocks.13/self_attn/Constant_4_attr::valueJ (/blocks.13/self_attn/Constant_5_output_0/blocks.13/self_attn/Constant_5"Constant*G value*;B+/blocks.13/self_attn/Constant_5_attr::valueJ  )/blocks.13/self_attn/Unsqueeze_2_output_0 )/blocks.13/self_attn/Unsqueeze_3_output_0 (/blocks.13/self_attn/Constant_4_output_0 (/blocks.13/self_attn/Constant_5_output_0&/blocks.13/self_attn/Concat_1_output_0/blocks.13/self_attn/Concat_1"Concat* axis fonnx::Unsqueeze_4170 Constant_5984"Constant*5 value*)BConstant_5984_attr::valueJ  $/blocks.13/self_attn/Gather_output_0 onnx::Unsqueeze_4170)/blocks.13/self_attn/Unsqueeze_4_output_0 /blocks.13/self_attn/Unsqueeze_4" Unsqueeze fonnx::Unsqueeze_4172 Constant_5986"Constant*5 value*)BConstant_5986_attr::valueJ  &/blocks.13/self_attn/Gather_1_output_0 onnx::Unsqueeze_4172)/blocks.13/self_attn/Unsqueeze_5_output_0 /blocks.13/self_attn/Unsqueeze_5" Unsqueeze (/blocks.13/self_attn/Constant_6_output_0/blocks.13/self_attn/Constant_6"Constant*G value*;B+/blocks.13/self_attn/Constant_6_attr::valueJ (/blocks.13/self_attn/Constant_7_output_0/blocks.13/self_attn/Constant_7"Constant*G value*;B+/blocks.13/self_attn/Constant_7_attr::valueJ  )/blocks.13/self_attn/Unsqueeze_4_output_0 )/blocks.13/self_attn/Unsqueeze_5_output_0 (/blocks.13/self_attn/Constant_6_output_0 (/blocks.13/self_attn/Constant_7_output_0&/blocks.13/self_attn/Concat_2_output_0/blocks.13/self_attn/Concat_2"Concat* axis  +/blocks.13/self_attn/k_proj/MatMul_output_0 &/blocks.13/self_attn/Concat_1_output_0'/blocks.13/self_attn/Reshape_1_output_0/blocks.13/self_attn/Reshape_1"Reshape* allowzero  +/blocks.13/self_attn/v_proj/MatMul_output_0 &/blocks.13/self_attn/Concat_2_output_0'/blocks.13/self_attn/Reshape_2_output_0/blocks.13/self_attn/Reshape_2"Reshape* allowzero  %/blocks.13/self_attn/Reshape_output_0)/blocks.13/self_attn/q_norm/Cast_output_0 /blocks.13/self_attn/q_norm/Cast"Cast* to -/blocks.13/self_attn/q_norm/Constant_output_0$/blocks.13/self_attn/q_norm/Constant"Constant*F value*:B0/blocks.13/self_attn/q_norm/Constant_attr::valueJ@  )/blocks.13/self_attn/q_norm/Cast_output_0 -/blocks.13/self_attn/q_norm/Constant_output_0(/blocks.13/self_attn/q_norm/Pow_output_0/blocks.13/self_attn/q_norm/Pow"Pow  (/blocks.13/self_attn/q_norm/Pow_output_0//blocks.13/self_attn/q_norm/ReduceMean_output_0&/blocks.13/self_attn/q_norm/ReduceMean" ReduceMean* axes@* keepdims //blocks.13/self_attn/q_norm/Constant_1_output_0&/blocks.13/self_attn/q_norm/Constant_1"Constant*H value*<B2/blocks.13/self_attn/q_norm/Constant_1_attr::valueJ75  //blocks.13/self_attn/q_norm/ReduceMean_output_0 //blocks.13/self_attn/q_norm/Constant_1_output_0(/blocks.13/self_attn/q_norm/Add_output_0/blocks.13/self_attn/q_norm/Add"Add } (/blocks.13/self_attn/q_norm/Add_output_0)/blocks.13/self_attn/q_norm/Sqrt_output_0 /blocks.13/self_attn/q_norm/Sqrt"Sqrt //blocks.13/self_attn/q_norm/Constant_2_output_0&/blocks.13/self_attn/q_norm/Constant_2"Constant*H value*<B2/blocks.13/self_attn/q_norm/Constant_2_attr::valueJ?  //blocks.13/self_attn/q_norm/Constant_2_output_0 )/blocks.13/self_attn/q_norm/Sqrt_output_0(/blocks.13/self_attn/q_norm/Div_output_0/blocks.13/self_attn/q_norm/Div"Div  )/blocks.13/self_attn/q_norm/Cast_output_0+/blocks.13/self_attn/q_norm/Cast_1_output_0"/blocks.13/self_attn/q_norm/Cast_1"Cast* to  +/blocks.13/self_attn/q_norm/Cast_1_output_0 (/blocks.13/self_attn/q_norm/Div_output_0(/blocks.13/self_attn/q_norm/Mul_output_0/blocks.13/self_attn/q_norm/Mul"Mul  (/blocks.13/self_attn/q_norm/Mul_output_0 !blocks.13.self_attn.q_norm.weight*/blocks.13/self_attn/q_norm/Mul_1_output_0!/blocks.13/self_attn/q_norm/Mul_1"Mul  */blocks.13/self_attn/q_norm/Mul_1_output_0+/blocks.13/self_attn/q_norm/Cast_2_output_0"/blocks.13/self_attn/q_norm/Cast_2"Cast* to  '/blocks.13/self_attn/Reshape_1_output_0)/blocks.13/self_attn/k_norm/Cast_output_0 /blocks.13/self_attn/k_norm/Cast"Cast* to -/blocks.13/self_attn/k_norm/Constant_output_0$/blocks.13/self_attn/k_norm/Constant"Constant*F value*:B0/blocks.13/self_attn/k_norm/Constant_attr::valueJ@  )/blocks.13/self_attn/k_norm/Cast_output_0 -/blocks.13/self_attn/k_norm/Constant_output_0(/blocks.13/self_attn/k_norm/Pow_output_0/blocks.13/self_attn/k_norm/Pow"Pow  (/blocks.13/self_attn/k_norm/Pow_output_0//blocks.13/self_attn/k_norm/ReduceMean_output_0&/blocks.13/self_attn/k_norm/ReduceMean" ReduceMean* axes@* keepdims //blocks.13/self_attn/k_norm/Constant_1_output_0&/blocks.13/self_attn/k_norm/Constant_1"Constant*H value*<B2/blocks.13/self_attn/k_norm/Constant_1_attr::valueJ75  //blocks.13/self_attn/k_norm/ReduceMean_output_0 //blocks.13/self_attn/k_norm/Constant_1_output_0(/blocks.13/self_attn/k_norm/Add_output_0/blocks.13/self_attn/k_norm/Add"Add } (/blocks.13/self_attn/k_norm/Add_output_0)/blocks.13/self_attn/k_norm/Sqrt_output_0 /blocks.13/self_attn/k_norm/Sqrt"Sqrt //blocks.13/self_attn/k_norm/Constant_2_output_0&/blocks.13/self_attn/k_norm/Constant_2"Constant*H value*<B2/blocks.13/self_attn/k_norm/Constant_2_attr::valueJ?  //blocks.13/self_attn/k_norm/Constant_2_output_0 )/blocks.13/self_attn/k_norm/Sqrt_output_0(/blocks.13/self_attn/k_norm/Div_output_0/blocks.13/self_attn/k_norm/Div"Div  )/blocks.13/self_attn/k_norm/Cast_output_0+/blocks.13/self_attn/k_norm/Cast_1_output_0"/blocks.13/self_attn/k_norm/Cast_1"Cast* to  +/blocks.13/self_attn/k_norm/Cast_1_output_0 (/blocks.13/self_attn/k_norm/Div_output_0(/blocks.13/self_attn/k_norm/Mul_output_0/blocks.13/self_attn/k_norm/Mul"Mul  (/blocks.13/self_attn/k_norm/Mul_output_0 !blocks.13.self_attn.k_norm.weight*/blocks.13/self_attn/k_norm/Mul_1_output_0!/blocks.13/self_attn/k_norm/Mul_1"Mul  */blocks.13/self_attn/k_norm/Mul_1_output_0+/blocks.13/self_attn/k_norm/Cast_2_output_0"/blocks.13/self_attn/k_norm/Cast_2"Cast* to  +/blocks.13/self_attn/q_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0!/blocks.13/self_attn/Mul_output_0/blocks.13/self_attn/Mul"Mul y +/blocks.13/self_attn/q_norm/Cast_2_output_0%/blocks.13/self_attn/Shape_2_output_0/blocks.13/self_attn/Shape_2"Shape (/blocks.13/self_attn/Constant_8_output_0/blocks.13/self_attn/Constant_8"Constant*E value*9B+/blocks.13/self_attn/Constant_8_attr::valueJ  %/blocks.13/self_attn/Shape_2_output_0 (/blocks.13/self_attn/Constant_8_output_0&/blocks.13/self_attn/Gather_2_output_0/blocks.13/self_attn/Gather_2"Gather* axis (/blocks.13/self_attn/Constant_9_output_0/blocks.13/self_attn/Constant_9"Constant*E value*9B+/blocks.13/self_attn/Constant_9_attr::valueJ  &/blocks.13/self_attn/Gather_2_output_0 (/blocks.13/self_attn/Constant_9_output_0!/blocks.13/self_attn/Div_output_0/blocks.13/self_attn/Div"Div s !/blocks.13/self_attn/Div_output_0"/blocks.13/self_attn/Cast_output_0/blocks.13/self_attn/Cast"Cast* to x "/blocks.13/self_attn/Cast_output_0$/blocks.13/self_attn/Cast_1_output_0/blocks.13/self_attn/Cast_1"Cast* to )/blocks.13/self_attn/Constant_10_output_0 /blocks.13/self_attn/Constant_10"Constant*H value*<B,/blocks.13/self_attn/Constant_10_attr::valueJ )/blocks.13/self_attn/Constant_11_output_0 /blocks.13/self_attn/Constant_11"Constant*H value*<B,/blocks.13/self_attn/Constant_11_attr::valueJ )/blocks.13/self_attn/Constant_12_output_0 /blocks.13/self_attn/Constant_12"Constant*H value*<B,/blocks.13/self_attn/Constant_12_attr::valueJ  $/blocks.13/self_attn/Cast_1_output_0 )/blocks.13/self_attn/Constant_12_output_0)/blocks.13/self_attn/Unsqueeze_6_output_0 /blocks.13/self_attn/Unsqueeze_6" Unsqueeze )/blocks.13/self_attn/Constant_13_output_0 /blocks.13/self_attn/Constant_13"Constant*H value*<B,/blocks.13/self_attn/Constant_13_attr::valueJ  +/blocks.13/self_attn/q_norm/Cast_2_output_0 )/blocks.13/self_attn/Constant_11_output_0 )/blocks.13/self_attn/Unsqueeze_6_output_0 )/blocks.13/self_attn/Constant_10_output_0 )/blocks.13/self_attn/Constant_13_output_0#/blocks.13/self_attn/Slice_output_0/blocks.13/self_attn/Slice"Slice )/blocks.13/self_attn/Constant_14_output_0 /blocks.13/self_attn/Constant_14"Constant*H value*<B,/blocks.13/self_attn/Constant_14_attr::valueJ )/blocks.13/self_attn/Constant_15_output_0 /blocks.13/self_attn/Constant_15"Constant*H value*<B,/blocks.13/self_attn/Constant_15_attr::valueJ  $/blocks.13/self_attn/Cast_1_output_0 )/blocks.13/self_attn/Constant_15_output_0)/blocks.13/self_attn/Unsqueeze_7_output_0 /blocks.13/self_attn/Unsqueeze_7" Unsqueeze )/blocks.13/self_attn/Constant_16_output_0 /blocks.13/self_attn/Constant_16"Constant*H value*<B,/blocks.13/self_attn/Constant_16_attr::valueJ )/blocks.13/self_attn/Constant_17_output_0 /blocks.13/self_attn/Constant_17"Constant*H value*<B,/blocks.13/self_attn/Constant_17_attr::valueJ  +/blocks.13/self_attn/q_norm/Cast_2_output_0 )/blocks.13/self_attn/Unsqueeze_7_output_0 )/blocks.13/self_attn/Constant_16_output_0 )/blocks.13/self_attn/Constant_14_output_0 )/blocks.13/self_attn/Constant_17_output_0%/blocks.13/self_attn/Slice_1_output_0/blocks.13/self_attn/Slice_1"Slice i %/blocks.13/self_attn/Slice_1_output_0!/blocks.13/self_attn/Neg_output_0/blocks.13/self_attn/Neg"Neg  !/blocks.13/self_attn/Neg_output_0 #/blocks.13/self_attn/Slice_output_0&/blocks.13/self_attn/Concat_3_output_0/blocks.13/self_attn/Concat_3"Concat* axis  &/blocks.13/self_attn/Concat_3_output_0 %/blocks.0/self_attn/Gather_3_output_0#/blocks.13/self_attn/Mul_1_output_0/blocks.13/self_attn/Mul_1"Mul  !/blocks.13/self_attn/Mul_output_0 #/blocks.13/self_attn/Mul_1_output_0!/blocks.13/self_attn/Add_output_0/blocks.13/self_attn/Add"Add  +/blocks.13/self_attn/k_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0#/blocks.13/self_attn/Mul_2_output_0/blocks.13/self_attn/Mul_2"Mul y +/blocks.13/self_attn/k_norm/Cast_2_output_0%/blocks.13/self_attn/Shape_3_output_0/blocks.13/self_attn/Shape_3"Shape )/blocks.13/self_attn/Constant_18_output_0 /blocks.13/self_attn/Constant_18"Constant*F value*:B,/blocks.13/self_attn/Constant_18_attr::valueJ  %/blocks.13/self_attn/Shape_3_output_0 )/blocks.13/self_attn/Constant_18_output_0&/blocks.13/self_attn/Gather_3_output_0/blocks.13/self_attn/Gather_3"Gather* axis )/blocks.13/self_attn/Constant_19_output_0 /blocks.13/self_attn/Constant_19"Constant*F value*:B,/blocks.13/self_attn/Constant_19_attr::valueJ  &/blocks.13/self_attn/Gather_3_output_0 )/blocks.13/self_attn/Constant_19_output_0#/blocks.13/self_attn/Div_1_output_0/blocks.13/self_attn/Div_1"Div y #/blocks.13/self_attn/Div_1_output_0$/blocks.13/self_attn/Cast_2_output_0/blocks.13/self_attn/Cast_2"Cast* to z $/blocks.13/self_attn/Cast_2_output_0$/blocks.13/self_attn/Cast_3_output_0/blocks.13/self_attn/Cast_3"Cast* to )/blocks.13/self_attn/Constant_20_output_0 /blocks.13/self_attn/Constant_20"Constant*H value*<B,/blocks.13/self_attn/Constant_20_attr::valueJ )/blocks.13/self_attn/Constant_21_output_0 /blocks.13/self_attn/Constant_21"Constant*H value*<B,/blocks.13/self_attn/Constant_21_attr::valueJ )/blocks.13/self_attn/Constant_22_output_0 /blocks.13/self_attn/Constant_22"Constant*H value*<B,/blocks.13/self_attn/Constant_22_attr::valueJ  $/blocks.13/self_attn/Cast_3_output_0 )/blocks.13/self_attn/Constant_22_output_0)/blocks.13/self_attn/Unsqueeze_8_output_0 /blocks.13/self_attn/Unsqueeze_8" Unsqueeze )/blocks.13/self_attn/Constant_23_output_0 /blocks.13/self_attn/Constant_23"Constant*H value*<B,/blocks.13/self_attn/Constant_23_attr::valueJ  +/blocks.13/self_attn/k_norm/Cast_2_output_0 )/blocks.13/self_attn/Constant_21_output_0 )/blocks.13/self_attn/Unsqueeze_8_output_0 )/blocks.13/self_attn/Constant_20_output_0 )/blocks.13/self_attn/Constant_23_output_0%/blocks.13/self_attn/Slice_2_output_0/blocks.13/self_attn/Slice_2"Slice )/blocks.13/self_attn/Constant_24_output_0 /blocks.13/self_attn/Constant_24"Constant*H value*<B,/blocks.13/self_attn/Constant_24_attr::valueJ )/blocks.13/self_attn/Constant_25_output_0 /blocks.13/self_attn/Constant_25"Constant*H value*<B,/blocks.13/self_attn/Constant_25_attr::valueJ  $/blocks.13/self_attn/Cast_3_output_0 )/blocks.13/self_attn/Constant_25_output_0)/blocks.13/self_attn/Unsqueeze_9_output_0 /blocks.13/self_attn/Unsqueeze_9" Unsqueeze )/blocks.13/self_attn/Constant_26_output_0 /blocks.13/self_attn/Constant_26"Constant*H value*<B,/blocks.13/self_attn/Constant_26_attr::valueJ )/blocks.13/self_attn/Constant_27_output_0 /blocks.13/self_attn/Constant_27"Constant*H value*<B,/blocks.13/self_attn/Constant_27_attr::valueJ  +/blocks.13/self_attn/k_norm/Cast_2_output_0 )/blocks.13/self_attn/Unsqueeze_9_output_0 )/blocks.13/self_attn/Constant_26_output_0 )/blocks.13/self_attn/Constant_24_output_0 )/blocks.13/self_attn/Constant_27_output_0%/blocks.13/self_attn/Slice_3_output_0/blocks.13/self_attn/Slice_3"Slice m %/blocks.13/self_attn/Slice_3_output_0#/blocks.13/self_attn/Neg_1_output_0/blocks.13/self_attn/Neg_1"Neg  #/blocks.13/self_attn/Neg_1_output_0 %/blocks.13/self_attn/Slice_2_output_0&/blocks.13/self_attn/Concat_4_output_0/blocks.13/self_attn/Concat_4"Concat* axis  &/blocks.13/self_attn/Concat_4_output_0 %/blocks.0/self_attn/Gather_3_output_0#/blocks.13/self_attn/Mul_3_output_0/blocks.13/self_attn/Mul_3"Mul  #/blocks.13/self_attn/Mul_2_output_0 #/blocks.13/self_attn/Mul_3_output_0#/blocks.13/self_attn/Add_1_output_0/blocks.13/self_attn/Add_1"Add  /Gather_13_output_0 /rotary/Constant_3_output_0&/blocks.13/self_attn/Gather_4_output_0/blocks.13/self_attn/Gather_4"Gather* axis  /Gather_13_output_0 /rotary/Constant_8_output_0&/blocks.13/self_attn/Gather_5_output_0/blocks.13/self_attn/Gather_5"Gather* axis  &/blocks.13/self_attn/Gather_4_output_0 #/blocks.13/self_attn/Add_1_output_0&/blocks.13/self_attn/Concat_5_output_0/blocks.13/self_attn/Concat_5"Concat* axis  &/blocks.13/self_attn/Gather_5_output_0 '/blocks.13/self_attn/Reshape_2_output_0&/blocks.13/self_attn/Concat_6_output_0/blocks.13/self_attn/Concat_6"Concat* axis )/blocks.13/self_attn/Constant_28_output_0 /blocks.13/self_attn/Constant_28"Constant*H value*<B,/blocks.13/self_attn/Constant_28_attr::valueJ  &/blocks.13/self_attn/Concat_5_output_0 )/blocks.13/self_attn/Constant_28_output_0*/blocks.13/self_attn/Unsqueeze_10_output_0!/blocks.13/self_attn/Unsqueeze_10" Unsqueeze )/blocks.13/self_attn/Constant_29_output_0 /blocks.13/self_attn/Constant_29"Constant*H value*<B,/blocks.13/self_attn/Constant_29_attr::valueJ  &/blocks.13/self_attn/Concat_6_output_0 )/blocks.13/self_attn/Constant_29_output_0*/blocks.13/self_attn/Unsqueeze_11_output_0!/blocks.13/self_attn/Unsqueeze_11" Unsqueeze  */blocks.13/self_attn/Unsqueeze_10_output_0 */blocks.13/self_attn/Unsqueeze_11_output_0&/blocks.13/self_attn/Concat_7_output_0/blocks.13/self_attn/Concat_7"Concat* axis  !/blocks.13/self_attn/Add_output_0'/blocks.13/self_attn/Transpose_output_0/blocks.13/self_attn/Transpose" Transpose* perm@@@@  &/blocks.13/self_attn/Concat_5_output_0)/blocks.13/self_attn/Transpose_1_output_0 /blocks.13/self_attn/Transpose_1" Transpose* perm@@@@  &/blocks.13/self_attn/Concat_6_output_0)/blocks.13/self_attn/Transpose_2_output_0 /blocks.13/self_attn/Transpose_2" Transpose* perm@@@@ w )/blocks.13/self_attn/Transpose_1_output_0%/blocks.13/self_attn/Shape_4_output_0/blocks.13/self_attn/Shape_4"Shape )/blocks.13/self_attn/Constant_30_output_0 /blocks.13/self_attn/Constant_30"Constant*F value*:B,/blocks.13/self_attn/Constant_30_attr::valueJ  %/blocks.13/self_attn/Shape_4_output_0 )/blocks.13/self_attn/Constant_30_output_0&/blocks.13/self_attn/Gather_6_output_0/blocks.13/self_attn/Gather_6"Gather* axis w )/blocks.13/self_attn/Transpose_1_output_0%/blocks.13/self_attn/Shape_5_output_0/blocks.13/self_attn/Shape_5"Shape )/blocks.13/self_attn/Constant_31_output_0 /blocks.13/self_attn/Constant_31"Constant*F value*:B,/blocks.13/self_attn/Constant_31_attr::valueJ  %/blocks.13/self_attn/Shape_5_output_0 )/blocks.13/self_attn/Constant_31_output_0&/blocks.13/self_attn/Gather_7_output_0/blocks.13/self_attn/Gather_7"Gather* axis w )/blocks.13/self_attn/Transpose_1_output_0%/blocks.13/self_attn/Shape_6_output_0/blocks.13/self_attn/Shape_6"Shape )/blocks.13/self_attn/Constant_32_output_0 /blocks.13/self_attn/Constant_32"Constant*F value*:B,/blocks.13/self_attn/Constant_32_attr::valueJ  %/blocks.13/self_attn/Shape_6_output_0 )/blocks.13/self_attn/Constant_32_output_0&/blocks.13/self_attn/Gather_8_output_0/blocks.13/self_attn/Gather_8"Gather* axis w )/blocks.13/self_attn/Transpose_1_output_0%/blocks.13/self_attn/Shape_7_output_0/blocks.13/self_attn/Shape_7"Shape )/blocks.13/self_attn/Constant_33_output_0 /blocks.13/self_attn/Constant_33"Constant*F value*:B,/blocks.13/self_attn/Constant_33_attr::valueJ  %/blocks.13/self_attn/Shape_7_output_0 )/blocks.13/self_attn/Constant_33_output_0&/blocks.13/self_attn/Gather_9_output_0/blocks.13/self_attn/Gather_9"Gather* axis )/blocks.13/self_attn/Constant_34_output_0 /blocks.13/self_attn/Constant_34"Constant*H value*<B,/blocks.13/self_attn/Constant_34_attr::valueJ  )/blocks.13/self_attn/Transpose_1_output_0 )/blocks.13/self_attn/Constant_34_output_0*/blocks.13/self_attn/Unsqueeze_12_output_0!/blocks.13/self_attn/Unsqueeze_12" Unsqueeze )/blocks.13/self_attn/Constant_35_output_0 /blocks.13/self_attn/Constant_35"Constant*H value*<B,/blocks.13/self_attn/Constant_35_attr::valueJ  &/blocks.13/self_attn/Gather_6_output_0 )/blocks.13/self_attn/Constant_35_output_0*/blocks.13/self_attn/Unsqueeze_13_output_0!/blocks.13/self_attn/Unsqueeze_13" Unsqueeze )/blocks.13/self_attn/Constant_36_output_0 /blocks.13/self_attn/Constant_36"Constant*H value*<B,/blocks.13/self_attn/Constant_36_attr::valueJ  &/blocks.13/self_attn/Gather_7_output_0 )/blocks.13/self_attn/Constant_36_output_0*/blocks.13/self_attn/Unsqueeze_14_output_0!/blocks.13/self_attn/Unsqueeze_14" Unsqueeze )/blocks.13/self_attn/Constant_37_output_0 /blocks.13/self_attn/Constant_37"Constant*H value*<B,/blocks.13/self_attn/Constant_37_attr::valueJ )/blocks.13/self_attn/Constant_38_output_0 /blocks.13/self_attn/Constant_38"Constant*H value*<B,/blocks.13/self_attn/Constant_38_attr::valueJ  &/blocks.13/self_attn/Gather_8_output_0 )/blocks.13/self_attn/Constant_38_output_0*/blocks.13/self_attn/Unsqueeze_15_output_0!/blocks.13/self_attn/Unsqueeze_15" Unsqueeze )/blocks.13/self_attn/Constant_39_output_0 /blocks.13/self_attn/Constant_39"Constant*H value*<B,/blocks.13/self_attn/Constant_39_attr::valueJ  &/blocks.13/self_attn/Gather_9_output_0 )/blocks.13/self_attn/Constant_39_output_0*/blocks.13/self_attn/Unsqueeze_16_output_0!/blocks.13/self_attn/Unsqueeze_16" Unsqueeze  */blocks.13/self_attn/Unsqueeze_13_output_0 */blocks.13/self_attn/Unsqueeze_14_output_0 )/blocks.13/self_attn/Constant_37_output_0 */blocks.13/self_attn/Unsqueeze_15_output_0 */blocks.13/self_attn/Unsqueeze_16_output_0&/blocks.13/self_attn/Concat_8_output_0/blocks.13/self_attn/Concat_8"Concat* axis )/blocks.13/self_attn/Constant_40_output_0 /blocks.13/self_attn/Constant_40"Constant*H value*<B,/blocks.13/self_attn/Constant_40_attr::valueJ  &/blocks.13/self_attn/Concat_8_output_0 )/blocks.13/self_attn/Constant_40_output_0'/blocks.13/self_attn/Reshape_3_output_0/blocks.13/self_attn/Reshape_3"Reshape* allowzero u '/blocks.13/self_attn/Reshape_3_output_0%/blocks.13/self_attn/Shape_8_output_0/blocks.13/self_attn/Shape_8"Shape  %/blocks.13/self_attn/Shape_8_output_0-/blocks.13/self_attn/ConstantOfShape_output_0$/blocks.13/self_attn/ConstantOfShape"ConstantOfShape*L value*@B0/blocks.13/self_attn/ConstantOfShape_attr::valueJ )/blocks.13/self_attn/Constant_41_output_0 /blocks.13/self_attn/Constant_41"Constant*F value*:B,/blocks.13/self_attn/Constant_41_attr::valueJ  -/blocks.13/self_attn/ConstantOfShape_output_0 )/blocks.13/self_attn/Constant_41_output_0#/blocks.13/self_attn/Mul_4_output_0/blocks.13/self_attn/Mul_4"Mul  '/blocks.13/self_attn/Reshape_3_output_0 #/blocks.13/self_attn/Mul_4_output_0#/blocks.13/self_attn/Equal_output_0/blocks.13/self_attn/Equal"Equal  #/blocks.13/self_attn/Equal_output_0 -/blocks.13/self_attn/ConstantOfShape_output_0 '/blocks.13/self_attn/Reshape_3_output_0#/blocks.13/self_attn/Where_output_0/blocks.13/self_attn/Where"Where  */blocks.13/self_attn/Unsqueeze_12_output_0 #/blocks.13/self_attn/Where_output_0$/blocks.13/self_attn/Expand_output_0/blocks.13/self_attn/Expand"Expand )/blocks.13/self_attn/Constant_42_output_0 /blocks.13/self_attn/Constant_42"Constant*F value*:B,/blocks.13/self_attn/Constant_42_attr::valueJ  &/blocks.13/self_attn/Gather_7_output_0 )/blocks.13/self_attn/Constant_42_output_0#/blocks.13/self_attn/Mul_5_output_0/blocks.13/self_attn/Mul_5"Mul fonnx::Unsqueeze_4315 Constant_6114"Constant*5 value*)BConstant_6114_attr::valueJ  &/blocks.13/self_attn/Gather_6_output_0 onnx::Unsqueeze_4315*/blocks.13/self_attn/Unsqueeze_17_output_0!/blocks.13/self_attn/Unsqueeze_17" Unsqueeze fonnx::Unsqueeze_4317 Constant_6116"Constant*5 value*)BConstant_6116_attr::valueJ  #/blocks.13/self_attn/Mul_5_output_0 onnx::Unsqueeze_4317*/blocks.13/self_attn/Unsqueeze_18_output_0!/blocks.13/self_attn/Unsqueeze_18" Unsqueeze fonnx::Unsqueeze_4319 Constant_6118"Constant*5 value*)BConstant_6118_attr::valueJ  &/blocks.13/self_attn/Gather_8_output_0 onnx::Unsqueeze_4319*/blocks.13/self_attn/Unsqueeze_19_output_0!/blocks.13/self_attn/Unsqueeze_19" Unsqueeze fonnx::Unsqueeze_4321 Constant_6120"Constant*5 value*)BConstant_6120_attr::valueJ  &/blocks.13/self_attn/Gather_9_output_0 onnx::Unsqueeze_4321*/blocks.13/self_attn/Unsqueeze_20_output_0!/blocks.13/self_attn/Unsqueeze_20" Unsqueeze  */blocks.13/self_attn/Unsqueeze_17_output_0 */blocks.13/self_attn/Unsqueeze_18_output_0 */blocks.13/self_attn/Unsqueeze_19_output_0 */blocks.13/self_attn/Unsqueeze_20_output_0&/blocks.13/self_attn/Concat_9_output_0/blocks.13/self_attn/Concat_9"Concat* axis  $/blocks.13/self_attn/Expand_output_0 &/blocks.13/self_attn/Concat_9_output_0'/blocks.13/self_attn/Reshape_4_output_0/blocks.13/self_attn/Reshape_4"Reshape* allowzero w )/blocks.13/self_attn/Transpose_2_output_0%/blocks.13/self_attn/Shape_9_output_0/blocks.13/self_attn/Shape_9"Shape )/blocks.13/self_attn/Constant_43_output_0 /blocks.13/self_attn/Constant_43"Constant*F value*:B,/blocks.13/self_attn/Constant_43_attr::valueJ  %/blocks.13/self_attn/Shape_9_output_0 )/blocks.13/self_attn/Constant_43_output_0'/blocks.13/self_attn/Gather_10_output_0/blocks.13/self_attn/Gather_10"Gather* axis y )/blocks.13/self_attn/Transpose_2_output_0&/blocks.13/self_attn/Shape_10_output_0/blocks.13/self_attn/Shape_10"Shape )/blocks.13/self_attn/Constant_44_output_0 /blocks.13/self_attn/Constant_44"Constant*F value*:B,/blocks.13/self_attn/Constant_44_attr::valueJ  &/blocks.13/self_attn/Shape_10_output_0 )/blocks.13/self_attn/Constant_44_output_0'/blocks.13/self_attn/Gather_11_output_0/blocks.13/self_attn/Gather_11"Gather* axis y )/blocks.13/self_attn/Transpose_2_output_0&/blocks.13/self_attn/Shape_11_output_0/blocks.13/self_attn/Shape_11"Shape )/blocks.13/self_attn/Constant_45_output_0 /blocks.13/self_attn/Constant_45"Constant*F value*:B,/blocks.13/self_attn/Constant_45_attr::valueJ  &/blocks.13/self_attn/Shape_11_output_0 )/blocks.13/self_attn/Constant_45_output_0'/blocks.13/self_attn/Gather_12_output_0/blocks.13/self_attn/Gather_12"Gather* axis y )/blocks.13/self_attn/Transpose_2_output_0&/blocks.13/self_attn/Shape_12_output_0/blocks.13/self_attn/Shape_12"Shape )/blocks.13/self_attn/Constant_46_output_0 /blocks.13/self_attn/Constant_46"Constant*F value*:B,/blocks.13/self_attn/Constant_46_attr::valueJ  &/blocks.13/self_attn/Shape_12_output_0 )/blocks.13/self_attn/Constant_46_output_0'/blocks.13/self_attn/Gather_13_output_0/blocks.13/self_attn/Gather_13"Gather* axis )/blocks.13/self_attn/Constant_47_output_0 /blocks.13/self_attn/Constant_47"Constant*H value*<B,/blocks.13/self_attn/Constant_47_attr::valueJ  )/blocks.13/self_attn/Transpose_2_output_0 )/blocks.13/self_attn/Constant_47_output_0*/blocks.13/self_attn/Unsqueeze_21_output_0!/blocks.13/self_attn/Unsqueeze_21" Unsqueeze )/blocks.13/self_attn/Constant_48_output_0 /blocks.13/self_attn/Constant_48"Constant*H value*<B,/blocks.13/self_attn/Constant_48_attr::valueJ  '/blocks.13/self_attn/Gather_10_output_0 )/blocks.13/self_attn/Constant_48_output_0*/blocks.13/self_attn/Unsqueeze_22_output_0!/blocks.13/self_attn/Unsqueeze_22" Unsqueeze )/blocks.13/self_attn/Constant_49_output_0 /blocks.13/self_attn/Constant_49"Constant*H value*<B,/blocks.13/self_attn/Constant_49_attr::valueJ  '/blocks.13/self_attn/Gather_11_output_0 )/blocks.13/self_attn/Constant_49_output_0*/blocks.13/self_attn/Unsqueeze_23_output_0!/blocks.13/self_attn/Unsqueeze_23" Unsqueeze )/blocks.13/self_attn/Constant_50_output_0 /blocks.13/self_attn/Constant_50"Constant*H value*<B,/blocks.13/self_attn/Constant_50_attr::valueJ )/blocks.13/self_attn/Constant_51_output_0 /blocks.13/self_attn/Constant_51"Constant*H value*<B,/blocks.13/self_attn/Constant_51_attr::valueJ  '/blocks.13/self_attn/Gather_12_output_0 )/blocks.13/self_attn/Constant_51_output_0*/blocks.13/self_attn/Unsqueeze_24_output_0!/blocks.13/self_attn/Unsqueeze_24" Unsqueeze )/blocks.13/self_attn/Constant_52_output_0 /blocks.13/self_attn/Constant_52"Constant*H value*<B,/blocks.13/self_attn/Constant_52_attr::valueJ  '/blocks.13/self_attn/Gather_13_output_0 )/blocks.13/self_attn/Constant_52_output_0*/blocks.13/self_attn/Unsqueeze_25_output_0!/blocks.13/self_attn/Unsqueeze_25" Unsqueeze  */blocks.13/self_attn/Unsqueeze_22_output_0 */blocks.13/self_attn/Unsqueeze_23_output_0 )/blocks.13/self_attn/Constant_50_output_0 */blocks.13/self_attn/Unsqueeze_24_output_0 */blocks.13/self_attn/Unsqueeze_25_output_0'/blocks.13/self_attn/Concat_10_output_0/blocks.13/self_attn/Concat_10"Concat* axis )/blocks.13/self_attn/Constant_53_output_0 /blocks.13/self_attn/Constant_53"Constant*H value*<B,/blocks.13/self_attn/Constant_53_attr::valueJ  '/blocks.13/self_attn/Concat_10_output_0 )/blocks.13/self_attn/Constant_53_output_0'/blocks.13/self_attn/Reshape_5_output_0/blocks.13/self_attn/Reshape_5"Reshape* allowzero w '/blocks.13/self_attn/Reshape_5_output_0&/blocks.13/self_attn/Shape_13_output_0/blocks.13/self_attn/Shape_13"Shape  &/blocks.13/self_attn/Shape_13_output_0//blocks.13/self_attn/ConstantOfShape_1_output_0&/blocks.13/self_attn/ConstantOfShape_1"ConstantOfShape*N value*BB2/blocks.13/self_attn/ConstantOfShape_1_attr::valueJ )/blocks.13/self_attn/Constant_54_output_0 /blocks.13/self_attn/Constant_54"Constant*F value*:B,/blocks.13/self_attn/Constant_54_attr::valueJ  //blocks.13/self_attn/ConstantOfShape_1_output_0 )/blocks.13/self_attn/Constant_54_output_0#/blocks.13/self_attn/Mul_6_output_0/blocks.13/self_attn/Mul_6"Mul  '/blocks.13/self_attn/Reshape_5_output_0 #/blocks.13/self_attn/Mul_6_output_0%/blocks.13/self_attn/Equal_1_output_0/blocks.13/self_attn/Equal_1"Equal  %/blocks.13/self_attn/Equal_1_output_0 //blocks.13/self_attn/ConstantOfShape_1_output_0 '/blocks.13/self_attn/Reshape_5_output_0%/blocks.13/self_attn/Where_1_output_0/blocks.13/self_attn/Where_1"Where  */blocks.13/self_attn/Unsqueeze_21_output_0 %/blocks.13/self_attn/Where_1_output_0&/blocks.13/self_attn/Expand_1_output_0/blocks.13/self_attn/Expand_1"Expand )/blocks.13/self_attn/Constant_55_output_0 /blocks.13/self_attn/Constant_55"Constant*F value*:B,/blocks.13/self_attn/Constant_55_attr::valueJ  '/blocks.13/self_attn/Gather_11_output_0 )/blocks.13/self_attn/Constant_55_output_0#/blocks.13/self_attn/Mul_7_output_0/blocks.13/self_attn/Mul_7"Mul fonnx::Unsqueeze_4361 Constant_6159"Constant*5 value*)BConstant_6159_attr::valueJ  '/blocks.13/self_attn/Gather_10_output_0 onnx::Unsqueeze_4361*/blocks.13/self_attn/Unsqueeze_26_output_0!/blocks.13/self_attn/Unsqueeze_26" Unsqueeze fonnx::Unsqueeze_4363 Constant_6161"Constant*5 value*)BConstant_6161_attr::valueJ  #/blocks.13/self_attn/Mul_7_output_0 onnx::Unsqueeze_4363*/blocks.13/self_attn/Unsqueeze_27_output_0!/blocks.13/self_attn/Unsqueeze_27" Unsqueeze fonnx::Unsqueeze_4365 Constant_6163"Constant*5 value*)BConstant_6163_attr::valueJ  '/blocks.13/self_attn/Gather_12_output_0 onnx::Unsqueeze_4365*/blocks.13/self_attn/Unsqueeze_28_output_0!/blocks.13/self_attn/Unsqueeze_28" Unsqueeze fonnx::Unsqueeze_4367 Constant_6165"Constant*5 value*)BConstant_6165_attr::valueJ  '/blocks.13/self_attn/Gather_13_output_0 onnx::Unsqueeze_4367*/blocks.13/self_attn/Unsqueeze_29_output_0!/blocks.13/self_attn/Unsqueeze_29" Unsqueeze  */blocks.13/self_attn/Unsqueeze_26_output_0 */blocks.13/self_attn/Unsqueeze_27_output_0 */blocks.13/self_attn/Unsqueeze_28_output_0 */blocks.13/self_attn/Unsqueeze_29_output_0'/blocks.13/self_attn/Concat_11_output_0/blocks.13/self_attn/Concat_11"Concat* axis  &/blocks.13/self_attn/Expand_1_output_0 '/blocks.13/self_attn/Concat_11_output_0'/blocks.13/self_attn/Reshape_6_output_0/blocks.13/self_attn/Reshape_6"Reshape* allowzero  '/blocks.13/self_attn/Transpose_output_0 '/blocks.13/self_attn/Reshape_4_output_0$/blocks.13/self_attn/MatMul_output_0/blocks.13/self_attn/MatMul"MatMul )/blocks.13/self_attn/Constant_56_output_0 /blocks.13/self_attn/Constant_56"Constant*B value*6B,/blocks.13/self_attn/Constant_56_attr::valueJ5A  $/blocks.13/self_attn/MatMul_output_0 )/blocks.13/self_attn/Constant_56_output_0#/blocks.13/self_attn/Div_2_output_0/blocks.13/self_attn/Div_2"Div { #/blocks.13/self_attn/Div_2_output_0 attention_mask#/blocks.13/self_attn/Add_2_output_0/blocks.13/self_attn/Add_2"Add  #/blocks.13/self_attn/Add_2_output_0%/blocks.13/self_attn/Softmax_output_0/blocks.13/self_attn/Softmax"Softmax* axis { %/blocks.13/self_attn/Softmax_output_0$/blocks.13/self_attn/Cast_4_output_0/blocks.13/self_attn/Cast_4"Cast* to  $/blocks.13/self_attn/Cast_4_output_0 '/blocks.13/self_attn/Reshape_6_output_0&/blocks.13/self_attn/MatMul_1_output_0/blocks.13/self_attn/MatMul_1"MatMul  &/blocks.13/self_attn/MatMul_1_output_0)/blocks.13/self_attn/Transpose_3_output_0 /blocks.13/self_attn/Transpose_3" Transpose* perm@@@@ fonnx::Unsqueeze_4379 Constant_6177"Constant*5 value*)BConstant_6177_attr::valueJ  $/blocks.13/self_attn/Gather_output_0 onnx::Unsqueeze_4379*/blocks.13/self_attn/Unsqueeze_30_output_0!/blocks.13/self_attn/Unsqueeze_30" Unsqueeze fonnx::Unsqueeze_4381 Constant_6179"Constant*5 value*)BConstant_6179_attr::valueJ  &/blocks.13/self_attn/Gather_1_output_0 onnx::Unsqueeze_4381*/blocks.13/self_attn/Unsqueeze_31_output_0!/blocks.13/self_attn/Unsqueeze_31" Unsqueeze )/blocks.13/self_attn/Constant_57_output_0 /blocks.13/self_attn/Constant_57"Constant*H value*<B,/blocks.13/self_attn/Constant_57_attr::valueJ  */blocks.13/self_attn/Unsqueeze_30_output_0 */blocks.13/self_attn/Unsqueeze_31_output_0 )/blocks.13/self_attn/Constant_57_output_0'/blocks.13/self_attn/Concat_12_output_0/blocks.13/self_attn/Concat_12"Concat* axis  )/blocks.13/self_attn/Transpose_3_output_0 '/blocks.13/self_attn/Concat_12_output_0'/blocks.13/self_attn/Reshape_7_output_0/blocks.13/self_attn/Reshape_7"Reshape* allowzero  '/blocks.13/self_attn/Reshape_7_output_0 onnx::MatMul_8953+/blocks.13/self_attn/o_proj/MatMul_output_0"/blocks.13/self_attn/o_proj/MatMul"MatMul  */blocks.13/input_layernorm/Cast_1_output_0 +/blocks.13/self_attn/o_proj/MatMul_output_0/blocks.13/Add_output_0/blocks.13/Add"Add  /blocks.13/Add_output_01/blocks.13/post_attention_layernorm/Cast_output_0(/blocks.13/post_attention_layernorm/Cast"Cast* to 5/blocks.13/post_attention_layernorm/Constant_output_0,/blocks.13/post_attention_layernorm/Constant"Constant*N value*BB8/blocks.13/post_attention_layernorm/Constant_attr::valueJ@  1/blocks.13/post_attention_layernorm/Cast_output_0 5/blocks.13/post_attention_layernorm/Constant_output_00/blocks.13/post_attention_layernorm/Pow_output_0'/blocks.13/post_attention_layernorm/Pow"Pow  0/blocks.13/post_attention_layernorm/Pow_output_07/blocks.13/post_attention_layernorm/ReduceMean_output_0./blocks.13/post_attention_layernorm/ReduceMean" ReduceMean* axes@* keepdims 7/blocks.13/post_attention_layernorm/Constant_1_output_0./blocks.13/post_attention_layernorm/Constant_1"Constant*P value*DB:/blocks.13/post_attention_layernorm/Constant_1_attr::valueJ75  7/blocks.13/post_attention_layernorm/ReduceMean_output_0 7/blocks.13/post_attention_layernorm/Constant_1_output_00/blocks.13/post_attention_layernorm/Add_output_0'/blocks.13/post_attention_layernorm/Add"Add  0/blocks.13/post_attention_layernorm/Add_output_01/blocks.13/post_attention_layernorm/Sqrt_output_0(/blocks.13/post_attention_layernorm/Sqrt"Sqrt 7/blocks.13/post_attention_layernorm/Constant_2_output_0./blocks.13/post_attention_layernorm/Constant_2"Constant*P value*DB:/blocks.13/post_attention_layernorm/Constant_2_attr::valueJ?  7/blocks.13/post_attention_layernorm/Constant_2_output_0 1/blocks.13/post_attention_layernorm/Sqrt_output_00/blocks.13/post_attention_layernorm/Div_output_0'/blocks.13/post_attention_layernorm/Div"Div  1/blocks.13/post_attention_layernorm/Cast_output_03/blocks.13/post_attention_layernorm/Cast_1_output_0*/blocks.13/post_attention_layernorm/Cast_1"Cast* to  3/blocks.13/post_attention_layernorm/Cast_1_output_0 0/blocks.13/post_attention_layernorm/Div_output_00/blocks.13/post_attention_layernorm/Mul_output_0'/blocks.13/post_attention_layernorm/Mul"Mul  0/blocks.13/post_attention_layernorm/Mul_output_0 )blocks.13.post_attention_layernorm.weight2/blocks.13/post_attention_layernorm/Mul_1_output_0)/blocks.13/post_attention_layernorm/Mul_1"Mul  2/blocks.13/post_attention_layernorm/Mul_1_output_03/blocks.13/post_attention_layernorm/Cast_2_output_0*/blocks.13/post_attention_layernorm/Cast_2"Cast* to  3/blocks.13/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_8954(/blocks.13/mlp/gate_proj/MatMul_output_0/blocks.13/mlp/gate_proj/MatMul"MatMul z (/blocks.13/mlp/gate_proj/MatMul_output_0&/blocks.13/mlp/act_fn/Sigmoid_output_0/blocks.13/mlp/act_fn/Sigmoid"Sigmoid  (/blocks.13/mlp/gate_proj/MatMul_output_0 &/blocks.13/mlp/act_fn/Sigmoid_output_0"/blocks.13/mlp/act_fn/Mul_output_0/blocks.13/mlp/act_fn/Mul"Mul  3/blocks.13/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_8955&/blocks.13/mlp/up_proj/MatMul_output_0/blocks.13/mlp/up_proj/MatMul"MatMul  "/blocks.13/mlp/act_fn/Mul_output_0 &/blocks.13/mlp/up_proj/MatMul_output_0/blocks.13/mlp/Mul_output_0/blocks.13/mlp/Mul"Mul  /blocks.13/mlp/Mul_output_0 onnx::MatMul_8956(/blocks.13/mlp/down_proj/MatMul_output_0/blocks.13/mlp/down_proj/MatMul"MatMul  3/blocks.13/post_attention_layernorm/Cast_1_output_0 (/blocks.13/mlp/down_proj/MatMul_output_0/blocks.13/Add_1_output_0/blocks.13/Add_1"Add `/Constant_7_output_0 /Constant_7"Constant*1 value*%B/Constant_7_attr::valueJ ] past_key_values /Constant_7_output_0/Gather_14_output_0 /Gather_14"Gather* axis /blocks.14/Constant_output_0/blocks.14/Constant"Constant*K value*?B/blocks.14/Constant_attr::valueJ  /blocks.13/Add_1_output_0 /blocks.14/Constant_output_0/blocks.14/Reshape_output_0/blocks.14/Reshape"Reshape* allowzero y /blocks.14/Reshape_output_0(/blocks.14/input_layernorm/Cast_output_0/blocks.14/input_layernorm/Cast"Cast* to ,/blocks.14/input_layernorm/Constant_output_0#/blocks.14/input_layernorm/Constant"Constant*E value*9B//blocks.14/input_layernorm/Constant_attr::valueJ@  (/blocks.14/input_layernorm/Cast_output_0 ,/blocks.14/input_layernorm/Constant_output_0'/blocks.14/input_layernorm/Pow_output_0/blocks.14/input_layernorm/Pow"Pow  '/blocks.14/input_layernorm/Pow_output_0./blocks.14/input_layernorm/ReduceMean_output_0%/blocks.14/input_layernorm/ReduceMean" ReduceMean* axes@* keepdims ./blocks.14/input_layernorm/Constant_1_output_0%/blocks.14/input_layernorm/Constant_1"Constant*G value*;B1/blocks.14/input_layernorm/Constant_1_attr::valueJ75  ./blocks.14/input_layernorm/ReduceMean_output_0 ./blocks.14/input_layernorm/Constant_1_output_0'/blocks.14/input_layernorm/Add_output_0/blocks.14/input_layernorm/Add"Add z '/blocks.14/input_layernorm/Add_output_0(/blocks.14/input_layernorm/Sqrt_output_0/blocks.14/input_layernorm/Sqrt"Sqrt ./blocks.14/input_layernorm/Constant_2_output_0%/blocks.14/input_layernorm/Constant_2"Constant*G value*;B1/blocks.14/input_layernorm/Constant_2_attr::valueJ?  ./blocks.14/input_layernorm/Constant_2_output_0 (/blocks.14/input_layernorm/Sqrt_output_0'/blocks.14/input_layernorm/Div_output_0/blocks.14/input_layernorm/Div"Div  (/blocks.14/input_layernorm/Cast_output_0*/blocks.14/input_layernorm/Cast_1_output_0!/blocks.14/input_layernorm/Cast_1"Cast* to  */blocks.14/input_layernorm/Cast_1_output_0 '/blocks.14/input_layernorm/Div_output_0'/blocks.14/input_layernorm/Mul_output_0/blocks.14/input_layernorm/Mul"Mul  '/blocks.14/input_layernorm/Mul_output_0 blocks.14.input_layernorm.weight)/blocks.14/input_layernorm/Mul_1_output_0 /blocks.14/input_layernorm/Mul_1"Mul  )/blocks.14/input_layernorm/Mul_1_output_0*/blocks.14/input_layernorm/Cast_2_output_0!/blocks.14/input_layernorm/Cast_2"Cast* to t */blocks.14/input_layernorm/Cast_2_output_0#/blocks.14/self_attn/Shape_output_0/blocks.14/self_attn/Shape"Shape &/blocks.14/self_attn/Constant_output_0/blocks.14/self_attn/Constant"Constant*C value*7B)/blocks.14/self_attn/Constant_attr::valueJ  #/blocks.14/self_attn/Shape_output_0 &/blocks.14/self_attn/Constant_output_0$/blocks.14/self_attn/Gather_output_0/blocks.14/self_attn/Gather"Gather* axis x */blocks.14/input_layernorm/Cast_2_output_0%/blocks.14/self_attn/Shape_1_output_0/blocks.14/self_attn/Shape_1"Shape (/blocks.14/self_attn/Constant_1_output_0/blocks.14/self_attn/Constant_1"Constant*E value*9B+/blocks.14/self_attn/Constant_1_attr::valueJ  %/blocks.14/self_attn/Shape_1_output_0 (/blocks.14/self_attn/Constant_1_output_0&/blocks.14/self_attn/Gather_1_output_0/blocks.14/self_attn/Gather_1"Gather* axis  */blocks.14/input_layernorm/Cast_2_output_0 onnx::MatMul_8957+/blocks.14/self_attn/q_proj/MatMul_output_0"/blocks.14/self_attn/q_proj/MatMul"MatMul  */blocks.14/input_layernorm/Cast_2_output_0 onnx::MatMul_8958+/blocks.14/self_attn/k_proj/MatMul_output_0"/blocks.14/self_attn/k_proj/MatMul"MatMul  */blocks.14/input_layernorm/Cast_2_output_0 onnx::MatMul_8959+/blocks.14/self_attn/v_proj/MatMul_output_0"/blocks.14/self_attn/v_proj/MatMul"MatMul fonnx::Unsqueeze_4442 Constant_6232"Constant*5 value*)BConstant_6232_attr::valueJ  $/blocks.14/self_attn/Gather_output_0 onnx::Unsqueeze_4442'/blocks.14/self_attn/Unsqueeze_output_0/blocks.14/self_attn/Unsqueeze" Unsqueeze fonnx::Unsqueeze_4444 Constant_6234"Constant*5 value*)BConstant_6234_attr::valueJ  &/blocks.14/self_attn/Gather_1_output_0 onnx::Unsqueeze_4444)/blocks.14/self_attn/Unsqueeze_1_output_0 /blocks.14/self_attn/Unsqueeze_1" Unsqueeze (/blocks.14/self_attn/Constant_2_output_0/blocks.14/self_attn/Constant_2"Constant*G value*;B+/blocks.14/self_attn/Constant_2_attr::valueJ (/blocks.14/self_attn/Constant_3_output_0/blocks.14/self_attn/Constant_3"Constant*G value*;B+/blocks.14/self_attn/Constant_3_attr::valueJ  '/blocks.14/self_attn/Unsqueeze_output_0 )/blocks.14/self_attn/Unsqueeze_1_output_0 (/blocks.14/self_attn/Constant_2_output_0 (/blocks.14/self_attn/Constant_3_output_0$/blocks.14/self_attn/Concat_output_0/blocks.14/self_attn/Concat"Concat* axis  +/blocks.14/self_attn/q_proj/MatMul_output_0 $/blocks.14/self_attn/Concat_output_0%/blocks.14/self_attn/Reshape_output_0/blocks.14/self_attn/Reshape"Reshape* allowzero fonnx::Unsqueeze_4452 Constant_6240"Constant*5 value*)BConstant_6240_attr::valueJ  $/blocks.14/self_attn/Gather_output_0 onnx::Unsqueeze_4452)/blocks.14/self_attn/Unsqueeze_2_output_0 /blocks.14/self_attn/Unsqueeze_2" Unsqueeze fonnx::Unsqueeze_4454 Constant_6242"Constant*5 value*)BConstant_6242_attr::valueJ  &/blocks.14/self_attn/Gather_1_output_0 onnx::Unsqueeze_4454)/blocks.14/self_attn/Unsqueeze_3_output_0 /blocks.14/self_attn/Unsqueeze_3" Unsqueeze (/blocks.14/self_attn/Constant_4_output_0/blocks.14/self_attn/Constant_4"Constant*G value*;B+/blocks.14/self_attn/Constant_4_attr::valueJ (/blocks.14/self_attn/Constant_5_output_0/blocks.14/self_attn/Constant_5"Constant*G value*;B+/blocks.14/self_attn/Constant_5_attr::valueJ  )/blocks.14/self_attn/Unsqueeze_2_output_0 )/blocks.14/self_attn/Unsqueeze_3_output_0 (/blocks.14/self_attn/Constant_4_output_0 (/blocks.14/self_attn/Constant_5_output_0&/blocks.14/self_attn/Concat_1_output_0/blocks.14/self_attn/Concat_1"Concat* axis fonnx::Unsqueeze_4461 Constant_6247"Constant*5 value*)BConstant_6247_attr::valueJ  $/blocks.14/self_attn/Gather_output_0 onnx::Unsqueeze_4461)/blocks.14/self_attn/Unsqueeze_4_output_0 /blocks.14/self_attn/Unsqueeze_4" Unsqueeze fonnx::Unsqueeze_4463 Constant_6249"Constant*5 value*)BConstant_6249_attr::valueJ  &/blocks.14/self_attn/Gather_1_output_0 onnx::Unsqueeze_4463)/blocks.14/self_attn/Unsqueeze_5_output_0 /blocks.14/self_attn/Unsqueeze_5" Unsqueeze (/blocks.14/self_attn/Constant_6_output_0/blocks.14/self_attn/Constant_6"Constant*G value*;B+/blocks.14/self_attn/Constant_6_attr::valueJ (/blocks.14/self_attn/Constant_7_output_0/blocks.14/self_attn/Constant_7"Constant*G value*;B+/blocks.14/self_attn/Constant_7_attr::valueJ  )/blocks.14/self_attn/Unsqueeze_4_output_0 )/blocks.14/self_attn/Unsqueeze_5_output_0 (/blocks.14/self_attn/Constant_6_output_0 (/blocks.14/self_attn/Constant_7_output_0&/blocks.14/self_attn/Concat_2_output_0/blocks.14/self_attn/Concat_2"Concat* axis  +/blocks.14/self_attn/k_proj/MatMul_output_0 &/blocks.14/self_attn/Concat_1_output_0'/blocks.14/self_attn/Reshape_1_output_0/blocks.14/self_attn/Reshape_1"Reshape* allowzero  +/blocks.14/self_attn/v_proj/MatMul_output_0 &/blocks.14/self_attn/Concat_2_output_0'/blocks.14/self_attn/Reshape_2_output_0/blocks.14/self_attn/Reshape_2"Reshape* allowzero  %/blocks.14/self_attn/Reshape_output_0)/blocks.14/self_attn/q_norm/Cast_output_0 /blocks.14/self_attn/q_norm/Cast"Cast* to -/blocks.14/self_attn/q_norm/Constant_output_0$/blocks.14/self_attn/q_norm/Constant"Constant*F value*:B0/blocks.14/self_attn/q_norm/Constant_attr::valueJ@  )/blocks.14/self_attn/q_norm/Cast_output_0 -/blocks.14/self_attn/q_norm/Constant_output_0(/blocks.14/self_attn/q_norm/Pow_output_0/blocks.14/self_attn/q_norm/Pow"Pow  (/blocks.14/self_attn/q_norm/Pow_output_0//blocks.14/self_attn/q_norm/ReduceMean_output_0&/blocks.14/self_attn/q_norm/ReduceMean" ReduceMean* axes@* keepdims //blocks.14/self_attn/q_norm/Constant_1_output_0&/blocks.14/self_attn/q_norm/Constant_1"Constant*H value*<B2/blocks.14/self_attn/q_norm/Constant_1_attr::valueJ75  //blocks.14/self_attn/q_norm/ReduceMean_output_0 //blocks.14/self_attn/q_norm/Constant_1_output_0(/blocks.14/self_attn/q_norm/Add_output_0/blocks.14/self_attn/q_norm/Add"Add } (/blocks.14/self_attn/q_norm/Add_output_0)/blocks.14/self_attn/q_norm/Sqrt_output_0 /blocks.14/self_attn/q_norm/Sqrt"Sqrt //blocks.14/self_attn/q_norm/Constant_2_output_0&/blocks.14/self_attn/q_norm/Constant_2"Constant*H value*<B2/blocks.14/self_attn/q_norm/Constant_2_attr::valueJ?  //blocks.14/self_attn/q_norm/Constant_2_output_0 )/blocks.14/self_attn/q_norm/Sqrt_output_0(/blocks.14/self_attn/q_norm/Div_output_0/blocks.14/self_attn/q_norm/Div"Div  )/blocks.14/self_attn/q_norm/Cast_output_0+/blocks.14/self_attn/q_norm/Cast_1_output_0"/blocks.14/self_attn/q_norm/Cast_1"Cast* to  +/blocks.14/self_attn/q_norm/Cast_1_output_0 (/blocks.14/self_attn/q_norm/Div_output_0(/blocks.14/self_attn/q_norm/Mul_output_0/blocks.14/self_attn/q_norm/Mul"Mul  (/blocks.14/self_attn/q_norm/Mul_output_0 !blocks.14.self_attn.q_norm.weight*/blocks.14/self_attn/q_norm/Mul_1_output_0!/blocks.14/self_attn/q_norm/Mul_1"Mul  */blocks.14/self_attn/q_norm/Mul_1_output_0+/blocks.14/self_attn/q_norm/Cast_2_output_0"/blocks.14/self_attn/q_norm/Cast_2"Cast* to  '/blocks.14/self_attn/Reshape_1_output_0)/blocks.14/self_attn/k_norm/Cast_output_0 /blocks.14/self_attn/k_norm/Cast"Cast* to -/blocks.14/self_attn/k_norm/Constant_output_0$/blocks.14/self_attn/k_norm/Constant"Constant*F value*:B0/blocks.14/self_attn/k_norm/Constant_attr::valueJ@  )/blocks.14/self_attn/k_norm/Cast_output_0 -/blocks.14/self_attn/k_norm/Constant_output_0(/blocks.14/self_attn/k_norm/Pow_output_0/blocks.14/self_attn/k_norm/Pow"Pow  (/blocks.14/self_attn/k_norm/Pow_output_0//blocks.14/self_attn/k_norm/ReduceMean_output_0&/blocks.14/self_attn/k_norm/ReduceMean" ReduceMean* axes@* keepdims //blocks.14/self_attn/k_norm/Constant_1_output_0&/blocks.14/self_attn/k_norm/Constant_1"Constant*H value*<B2/blocks.14/self_attn/k_norm/Constant_1_attr::valueJ75  //blocks.14/self_attn/k_norm/ReduceMean_output_0 //blocks.14/self_attn/k_norm/Constant_1_output_0(/blocks.14/self_attn/k_norm/Add_output_0/blocks.14/self_attn/k_norm/Add"Add } (/blocks.14/self_attn/k_norm/Add_output_0)/blocks.14/self_attn/k_norm/Sqrt_output_0 /blocks.14/self_attn/k_norm/Sqrt"Sqrt //blocks.14/self_attn/k_norm/Constant_2_output_0&/blocks.14/self_attn/k_norm/Constant_2"Constant*H value*<B2/blocks.14/self_attn/k_norm/Constant_2_attr::valueJ?  //blocks.14/self_attn/k_norm/Constant_2_output_0 )/blocks.14/self_attn/k_norm/Sqrt_output_0(/blocks.14/self_attn/k_norm/Div_output_0/blocks.14/self_attn/k_norm/Div"Div  )/blocks.14/self_attn/k_norm/Cast_output_0+/blocks.14/self_attn/k_norm/Cast_1_output_0"/blocks.14/self_attn/k_norm/Cast_1"Cast* to  +/blocks.14/self_attn/k_norm/Cast_1_output_0 (/blocks.14/self_attn/k_norm/Div_output_0(/blocks.14/self_attn/k_norm/Mul_output_0/blocks.14/self_attn/k_norm/Mul"Mul  (/blocks.14/self_attn/k_norm/Mul_output_0 !blocks.14.self_attn.k_norm.weight*/blocks.14/self_attn/k_norm/Mul_1_output_0!/blocks.14/self_attn/k_norm/Mul_1"Mul  */blocks.14/self_attn/k_norm/Mul_1_output_0+/blocks.14/self_attn/k_norm/Cast_2_output_0"/blocks.14/self_attn/k_norm/Cast_2"Cast* to  +/blocks.14/self_attn/q_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0!/blocks.14/self_attn/Mul_output_0/blocks.14/self_attn/Mul"Mul y +/blocks.14/self_attn/q_norm/Cast_2_output_0%/blocks.14/self_attn/Shape_2_output_0/blocks.14/self_attn/Shape_2"Shape (/blocks.14/self_attn/Constant_8_output_0/blocks.14/self_attn/Constant_8"Constant*E value*9B+/blocks.14/self_attn/Constant_8_attr::valueJ  %/blocks.14/self_attn/Shape_2_output_0 (/blocks.14/self_attn/Constant_8_output_0&/blocks.14/self_attn/Gather_2_output_0/blocks.14/self_attn/Gather_2"Gather* axis (/blocks.14/self_attn/Constant_9_output_0/blocks.14/self_attn/Constant_9"Constant*E value*9B+/blocks.14/self_attn/Constant_9_attr::valueJ  &/blocks.14/self_attn/Gather_2_output_0 (/blocks.14/self_attn/Constant_9_output_0!/blocks.14/self_attn/Div_output_0/blocks.14/self_attn/Div"Div s !/blocks.14/self_attn/Div_output_0"/blocks.14/self_attn/Cast_output_0/blocks.14/self_attn/Cast"Cast* to x "/blocks.14/self_attn/Cast_output_0$/blocks.14/self_attn/Cast_1_output_0/blocks.14/self_attn/Cast_1"Cast* to )/blocks.14/self_attn/Constant_10_output_0 /blocks.14/self_attn/Constant_10"Constant*H value*<B,/blocks.14/self_attn/Constant_10_attr::valueJ )/blocks.14/self_attn/Constant_11_output_0 /blocks.14/self_attn/Constant_11"Constant*H value*<B,/blocks.14/self_attn/Constant_11_attr::valueJ )/blocks.14/self_attn/Constant_12_output_0 /blocks.14/self_attn/Constant_12"Constant*H value*<B,/blocks.14/self_attn/Constant_12_attr::valueJ  $/blocks.14/self_attn/Cast_1_output_0 )/blocks.14/self_attn/Constant_12_output_0)/blocks.14/self_attn/Unsqueeze_6_output_0 /blocks.14/self_attn/Unsqueeze_6" Unsqueeze )/blocks.14/self_attn/Constant_13_output_0 /blocks.14/self_attn/Constant_13"Constant*H value*<B,/blocks.14/self_attn/Constant_13_attr::valueJ  +/blocks.14/self_attn/q_norm/Cast_2_output_0 )/blocks.14/self_attn/Constant_11_output_0 )/blocks.14/self_attn/Unsqueeze_6_output_0 )/blocks.14/self_attn/Constant_10_output_0 )/blocks.14/self_attn/Constant_13_output_0#/blocks.14/self_attn/Slice_output_0/blocks.14/self_attn/Slice"Slice )/blocks.14/self_attn/Constant_14_output_0 /blocks.14/self_attn/Constant_14"Constant*H value*<B,/blocks.14/self_attn/Constant_14_attr::valueJ )/blocks.14/self_attn/Constant_15_output_0 /blocks.14/self_attn/Constant_15"Constant*H value*<B,/blocks.14/self_attn/Constant_15_attr::valueJ  $/blocks.14/self_attn/Cast_1_output_0 )/blocks.14/self_attn/Constant_15_output_0)/blocks.14/self_attn/Unsqueeze_7_output_0 /blocks.14/self_attn/Unsqueeze_7" Unsqueeze )/blocks.14/self_attn/Constant_16_output_0 /blocks.14/self_attn/Constant_16"Constant*H value*<B,/blocks.14/self_attn/Constant_16_attr::valueJ )/blocks.14/self_attn/Constant_17_output_0 /blocks.14/self_attn/Constant_17"Constant*H value*<B,/blocks.14/self_attn/Constant_17_attr::valueJ  +/blocks.14/self_attn/q_norm/Cast_2_output_0 )/blocks.14/self_attn/Unsqueeze_7_output_0 )/blocks.14/self_attn/Constant_16_output_0 )/blocks.14/self_attn/Constant_14_output_0 )/blocks.14/self_attn/Constant_17_output_0%/blocks.14/self_attn/Slice_1_output_0/blocks.14/self_attn/Slice_1"Slice i %/blocks.14/self_attn/Slice_1_output_0!/blocks.14/self_attn/Neg_output_0/blocks.14/self_attn/Neg"Neg  !/blocks.14/self_attn/Neg_output_0 #/blocks.14/self_attn/Slice_output_0&/blocks.14/self_attn/Concat_3_output_0/blocks.14/self_attn/Concat_3"Concat* axis  &/blocks.14/self_attn/Concat_3_output_0 %/blocks.0/self_attn/Gather_3_output_0#/blocks.14/self_attn/Mul_1_output_0/blocks.14/self_attn/Mul_1"Mul  !/blocks.14/self_attn/Mul_output_0 #/blocks.14/self_attn/Mul_1_output_0!/blocks.14/self_attn/Add_output_0/blocks.14/self_attn/Add"Add  +/blocks.14/self_attn/k_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0#/blocks.14/self_attn/Mul_2_output_0/blocks.14/self_attn/Mul_2"Mul y +/blocks.14/self_attn/k_norm/Cast_2_output_0%/blocks.14/self_attn/Shape_3_output_0/blocks.14/self_attn/Shape_3"Shape )/blocks.14/self_attn/Constant_18_output_0 /blocks.14/self_attn/Constant_18"Constant*F value*:B,/blocks.14/self_attn/Constant_18_attr::valueJ  %/blocks.14/self_attn/Shape_3_output_0 )/blocks.14/self_attn/Constant_18_output_0&/blocks.14/self_attn/Gather_3_output_0/blocks.14/self_attn/Gather_3"Gather* axis )/blocks.14/self_attn/Constant_19_output_0 /blocks.14/self_attn/Constant_19"Constant*F value*:B,/blocks.14/self_attn/Constant_19_attr::valueJ  &/blocks.14/self_attn/Gather_3_output_0 )/blocks.14/self_attn/Constant_19_output_0#/blocks.14/self_attn/Div_1_output_0/blocks.14/self_attn/Div_1"Div y #/blocks.14/self_attn/Div_1_output_0$/blocks.14/self_attn/Cast_2_output_0/blocks.14/self_attn/Cast_2"Cast* to z $/blocks.14/self_attn/Cast_2_output_0$/blocks.14/self_attn/Cast_3_output_0/blocks.14/self_attn/Cast_3"Cast* to )/blocks.14/self_attn/Constant_20_output_0 /blocks.14/self_attn/Constant_20"Constant*H value*<B,/blocks.14/self_attn/Constant_20_attr::valueJ )/blocks.14/self_attn/Constant_21_output_0 /blocks.14/self_attn/Constant_21"Constant*H value*<B,/blocks.14/self_attn/Constant_21_attr::valueJ )/blocks.14/self_attn/Constant_22_output_0 /blocks.14/self_attn/Constant_22"Constant*H value*<B,/blocks.14/self_attn/Constant_22_attr::valueJ  $/blocks.14/self_attn/Cast_3_output_0 )/blocks.14/self_attn/Constant_22_output_0)/blocks.14/self_attn/Unsqueeze_8_output_0 /blocks.14/self_attn/Unsqueeze_8" Unsqueeze )/blocks.14/self_attn/Constant_23_output_0 /blocks.14/self_attn/Constant_23"Constant*H value*<B,/blocks.14/self_attn/Constant_23_attr::valueJ  +/blocks.14/self_attn/k_norm/Cast_2_output_0 )/blocks.14/self_attn/Constant_21_output_0 )/blocks.14/self_attn/Unsqueeze_8_output_0 )/blocks.14/self_attn/Constant_20_output_0 )/blocks.14/self_attn/Constant_23_output_0%/blocks.14/self_attn/Slice_2_output_0/blocks.14/self_attn/Slice_2"Slice )/blocks.14/self_attn/Constant_24_output_0 /blocks.14/self_attn/Constant_24"Constant*H value*<B,/blocks.14/self_attn/Constant_24_attr::valueJ )/blocks.14/self_attn/Constant_25_output_0 /blocks.14/self_attn/Constant_25"Constant*H value*<B,/blocks.14/self_attn/Constant_25_attr::valueJ  $/blocks.14/self_attn/Cast_3_output_0 )/blocks.14/self_attn/Constant_25_output_0)/blocks.14/self_attn/Unsqueeze_9_output_0 /blocks.14/self_attn/Unsqueeze_9" Unsqueeze )/blocks.14/self_attn/Constant_26_output_0 /blocks.14/self_attn/Constant_26"Constant*H value*<B,/blocks.14/self_attn/Constant_26_attr::valueJ )/blocks.14/self_attn/Constant_27_output_0 /blocks.14/self_attn/Constant_27"Constant*H value*<B,/blocks.14/self_attn/Constant_27_attr::valueJ  +/blocks.14/self_attn/k_norm/Cast_2_output_0 )/blocks.14/self_attn/Unsqueeze_9_output_0 )/blocks.14/self_attn/Constant_26_output_0 )/blocks.14/self_attn/Constant_24_output_0 )/blocks.14/self_attn/Constant_27_output_0%/blocks.14/self_attn/Slice_3_output_0/blocks.14/self_attn/Slice_3"Slice m %/blocks.14/self_attn/Slice_3_output_0#/blocks.14/self_attn/Neg_1_output_0/blocks.14/self_attn/Neg_1"Neg  #/blocks.14/self_attn/Neg_1_output_0 %/blocks.14/self_attn/Slice_2_output_0&/blocks.14/self_attn/Concat_4_output_0/blocks.14/self_attn/Concat_4"Concat* axis  &/blocks.14/self_attn/Concat_4_output_0 %/blocks.0/self_attn/Gather_3_output_0#/blocks.14/self_attn/Mul_3_output_0/blocks.14/self_attn/Mul_3"Mul  #/blocks.14/self_attn/Mul_2_output_0 #/blocks.14/self_attn/Mul_3_output_0#/blocks.14/self_attn/Add_1_output_0/blocks.14/self_attn/Add_1"Add  /Gather_14_output_0 /rotary/Constant_3_output_0&/blocks.14/self_attn/Gather_4_output_0/blocks.14/self_attn/Gather_4"Gather* axis  /Gather_14_output_0 /rotary/Constant_8_output_0&/blocks.14/self_attn/Gather_5_output_0/blocks.14/self_attn/Gather_5"Gather* axis  &/blocks.14/self_attn/Gather_4_output_0 #/blocks.14/self_attn/Add_1_output_0&/blocks.14/self_attn/Concat_5_output_0/blocks.14/self_attn/Concat_5"Concat* axis  &/blocks.14/self_attn/Gather_5_output_0 '/blocks.14/self_attn/Reshape_2_output_0&/blocks.14/self_attn/Concat_6_output_0/blocks.14/self_attn/Concat_6"Concat* axis )/blocks.14/self_attn/Constant_28_output_0 /blocks.14/self_attn/Constant_28"Constant*H value*<B,/blocks.14/self_attn/Constant_28_attr::valueJ  &/blocks.14/self_attn/Concat_5_output_0 )/blocks.14/self_attn/Constant_28_output_0*/blocks.14/self_attn/Unsqueeze_10_output_0!/blocks.14/self_attn/Unsqueeze_10" Unsqueeze )/blocks.14/self_attn/Constant_29_output_0 /blocks.14/self_attn/Constant_29"Constant*H value*<B,/blocks.14/self_attn/Constant_29_attr::valueJ  &/blocks.14/self_attn/Concat_6_output_0 )/blocks.14/self_attn/Constant_29_output_0*/blocks.14/self_attn/Unsqueeze_11_output_0!/blocks.14/self_attn/Unsqueeze_11" Unsqueeze  */blocks.14/self_attn/Unsqueeze_10_output_0 */blocks.14/self_attn/Unsqueeze_11_output_0&/blocks.14/self_attn/Concat_7_output_0/blocks.14/self_attn/Concat_7"Concat* axis  !/blocks.14/self_attn/Add_output_0'/blocks.14/self_attn/Transpose_output_0/blocks.14/self_attn/Transpose" Transpose* perm@@@@  &/blocks.14/self_attn/Concat_5_output_0)/blocks.14/self_attn/Transpose_1_output_0 /blocks.14/self_attn/Transpose_1" Transpose* perm@@@@  &/blocks.14/self_attn/Concat_6_output_0)/blocks.14/self_attn/Transpose_2_output_0 /blocks.14/self_attn/Transpose_2" Transpose* perm@@@@ w )/blocks.14/self_attn/Transpose_1_output_0%/blocks.14/self_attn/Shape_4_output_0/blocks.14/self_attn/Shape_4"Shape )/blocks.14/self_attn/Constant_30_output_0 /blocks.14/self_attn/Constant_30"Constant*F value*:B,/blocks.14/self_attn/Constant_30_attr::valueJ  %/blocks.14/self_attn/Shape_4_output_0 )/blocks.14/self_attn/Constant_30_output_0&/blocks.14/self_attn/Gather_6_output_0/blocks.14/self_attn/Gather_6"Gather* axis w )/blocks.14/self_attn/Transpose_1_output_0%/blocks.14/self_attn/Shape_5_output_0/blocks.14/self_attn/Shape_5"Shape )/blocks.14/self_attn/Constant_31_output_0 /blocks.14/self_attn/Constant_31"Constant*F value*:B,/blocks.14/self_attn/Constant_31_attr::valueJ  %/blocks.14/self_attn/Shape_5_output_0 )/blocks.14/self_attn/Constant_31_output_0&/blocks.14/self_attn/Gather_7_output_0/blocks.14/self_attn/Gather_7"Gather* axis w )/blocks.14/self_attn/Transpose_1_output_0%/blocks.14/self_attn/Shape_6_output_0/blocks.14/self_attn/Shape_6"Shape )/blocks.14/self_attn/Constant_32_output_0 /blocks.14/self_attn/Constant_32"Constant*F value*:B,/blocks.14/self_attn/Constant_32_attr::valueJ  %/blocks.14/self_attn/Shape_6_output_0 )/blocks.14/self_attn/Constant_32_output_0&/blocks.14/self_attn/Gather_8_output_0/blocks.14/self_attn/Gather_8"Gather* axis w )/blocks.14/self_attn/Transpose_1_output_0%/blocks.14/self_attn/Shape_7_output_0/blocks.14/self_attn/Shape_7"Shape )/blocks.14/self_attn/Constant_33_output_0 /blocks.14/self_attn/Constant_33"Constant*F value*:B,/blocks.14/self_attn/Constant_33_attr::valueJ  %/blocks.14/self_attn/Shape_7_output_0 )/blocks.14/self_attn/Constant_33_output_0&/blocks.14/self_attn/Gather_9_output_0/blocks.14/self_attn/Gather_9"Gather* axis )/blocks.14/self_attn/Constant_34_output_0 /blocks.14/self_attn/Constant_34"Constant*H value*<B,/blocks.14/self_attn/Constant_34_attr::valueJ  )/blocks.14/self_attn/Transpose_1_output_0 )/blocks.14/self_attn/Constant_34_output_0*/blocks.14/self_attn/Unsqueeze_12_output_0!/blocks.14/self_attn/Unsqueeze_12" Unsqueeze )/blocks.14/self_attn/Constant_35_output_0 /blocks.14/self_attn/Constant_35"Constant*H value*<B,/blocks.14/self_attn/Constant_35_attr::valueJ  &/blocks.14/self_attn/Gather_6_output_0 )/blocks.14/self_attn/Constant_35_output_0*/blocks.14/self_attn/Unsqueeze_13_output_0!/blocks.14/self_attn/Unsqueeze_13" Unsqueeze )/blocks.14/self_attn/Constant_36_output_0 /blocks.14/self_attn/Constant_36"Constant*H value*<B,/blocks.14/self_attn/Constant_36_attr::valueJ  &/blocks.14/self_attn/Gather_7_output_0 )/blocks.14/self_attn/Constant_36_output_0*/blocks.14/self_attn/Unsqueeze_14_output_0!/blocks.14/self_attn/Unsqueeze_14" Unsqueeze )/blocks.14/self_attn/Constant_37_output_0 /blocks.14/self_attn/Constant_37"Constant*H value*<B,/blocks.14/self_attn/Constant_37_attr::valueJ )/blocks.14/self_attn/Constant_38_output_0 /blocks.14/self_attn/Constant_38"Constant*H value*<B,/blocks.14/self_attn/Constant_38_attr::valueJ  &/blocks.14/self_attn/Gather_8_output_0 )/blocks.14/self_attn/Constant_38_output_0*/blocks.14/self_attn/Unsqueeze_15_output_0!/blocks.14/self_attn/Unsqueeze_15" Unsqueeze )/blocks.14/self_attn/Constant_39_output_0 /blocks.14/self_attn/Constant_39"Constant*H value*<B,/blocks.14/self_attn/Constant_39_attr::valueJ  &/blocks.14/self_attn/Gather_9_output_0 )/blocks.14/self_attn/Constant_39_output_0*/blocks.14/self_attn/Unsqueeze_16_output_0!/blocks.14/self_attn/Unsqueeze_16" Unsqueeze  */blocks.14/self_attn/Unsqueeze_13_output_0 */blocks.14/self_attn/Unsqueeze_14_output_0 )/blocks.14/self_attn/Constant_37_output_0 */blocks.14/self_attn/Unsqueeze_15_output_0 */blocks.14/self_attn/Unsqueeze_16_output_0&/blocks.14/self_attn/Concat_8_output_0/blocks.14/self_attn/Concat_8"Concat* axis )/blocks.14/self_attn/Constant_40_output_0 /blocks.14/self_attn/Constant_40"Constant*H value*<B,/blocks.14/self_attn/Constant_40_attr::valueJ  &/blocks.14/self_attn/Concat_8_output_0 )/blocks.14/self_attn/Constant_40_output_0'/blocks.14/self_attn/Reshape_3_output_0/blocks.14/self_attn/Reshape_3"Reshape* allowzero u '/blocks.14/self_attn/Reshape_3_output_0%/blocks.14/self_attn/Shape_8_output_0/blocks.14/self_attn/Shape_8"Shape  %/blocks.14/self_attn/Shape_8_output_0-/blocks.14/self_attn/ConstantOfShape_output_0$/blocks.14/self_attn/ConstantOfShape"ConstantOfShape*L value*@B0/blocks.14/self_attn/ConstantOfShape_attr::valueJ )/blocks.14/self_attn/Constant_41_output_0 /blocks.14/self_attn/Constant_41"Constant*F value*:B,/blocks.14/self_attn/Constant_41_attr::valueJ  -/blocks.14/self_attn/ConstantOfShape_output_0 )/blocks.14/self_attn/Constant_41_output_0#/blocks.14/self_attn/Mul_4_output_0/blocks.14/self_attn/Mul_4"Mul  '/blocks.14/self_attn/Reshape_3_output_0 #/blocks.14/self_attn/Mul_4_output_0#/blocks.14/self_attn/Equal_output_0/blocks.14/self_attn/Equal"Equal  #/blocks.14/self_attn/Equal_output_0 -/blocks.14/self_attn/ConstantOfShape_output_0 '/blocks.14/self_attn/Reshape_3_output_0#/blocks.14/self_attn/Where_output_0/blocks.14/self_attn/Where"Where  */blocks.14/self_attn/Unsqueeze_12_output_0 #/blocks.14/self_attn/Where_output_0$/blocks.14/self_attn/Expand_output_0/blocks.14/self_attn/Expand"Expand )/blocks.14/self_attn/Constant_42_output_0 /blocks.14/self_attn/Constant_42"Constant*F value*:B,/blocks.14/self_attn/Constant_42_attr::valueJ  &/blocks.14/self_attn/Gather_7_output_0 )/blocks.14/self_attn/Constant_42_output_0#/blocks.14/self_attn/Mul_5_output_0/blocks.14/self_attn/Mul_5"Mul fonnx::Unsqueeze_4606 Constant_6377"Constant*5 value*)BConstant_6377_attr::valueJ  &/blocks.14/self_attn/Gather_6_output_0 onnx::Unsqueeze_4606*/blocks.14/self_attn/Unsqueeze_17_output_0!/blocks.14/self_attn/Unsqueeze_17" Unsqueeze fonnx::Unsqueeze_4608 Constant_6379"Constant*5 value*)BConstant_6379_attr::valueJ  #/blocks.14/self_attn/Mul_5_output_0 onnx::Unsqueeze_4608*/blocks.14/self_attn/Unsqueeze_18_output_0!/blocks.14/self_attn/Unsqueeze_18" Unsqueeze fonnx::Unsqueeze_4610 Constant_6381"Constant*5 value*)BConstant_6381_attr::valueJ  &/blocks.14/self_attn/Gather_8_output_0 onnx::Unsqueeze_4610*/blocks.14/self_attn/Unsqueeze_19_output_0!/blocks.14/self_attn/Unsqueeze_19" Unsqueeze fonnx::Unsqueeze_4612 Constant_6383"Constant*5 value*)BConstant_6383_attr::valueJ  &/blocks.14/self_attn/Gather_9_output_0 onnx::Unsqueeze_4612*/blocks.14/self_attn/Unsqueeze_20_output_0!/blocks.14/self_attn/Unsqueeze_20" Unsqueeze  */blocks.14/self_attn/Unsqueeze_17_output_0 */blocks.14/self_attn/Unsqueeze_18_output_0 */blocks.14/self_attn/Unsqueeze_19_output_0 */blocks.14/self_attn/Unsqueeze_20_output_0&/blocks.14/self_attn/Concat_9_output_0/blocks.14/self_attn/Concat_9"Concat* axis  $/blocks.14/self_attn/Expand_output_0 &/blocks.14/self_attn/Concat_9_output_0'/blocks.14/self_attn/Reshape_4_output_0/blocks.14/self_attn/Reshape_4"Reshape* allowzero w )/blocks.14/self_attn/Transpose_2_output_0%/blocks.14/self_attn/Shape_9_output_0/blocks.14/self_attn/Shape_9"Shape )/blocks.14/self_attn/Constant_43_output_0 /blocks.14/self_attn/Constant_43"Constant*F value*:B,/blocks.14/self_attn/Constant_43_attr::valueJ  %/blocks.14/self_attn/Shape_9_output_0 )/blocks.14/self_attn/Constant_43_output_0'/blocks.14/self_attn/Gather_10_output_0/blocks.14/self_attn/Gather_10"Gather* axis y )/blocks.14/self_attn/Transpose_2_output_0&/blocks.14/self_attn/Shape_10_output_0/blocks.14/self_attn/Shape_10"Shape )/blocks.14/self_attn/Constant_44_output_0 /blocks.14/self_attn/Constant_44"Constant*F value*:B,/blocks.14/self_attn/Constant_44_attr::valueJ  &/blocks.14/self_attn/Shape_10_output_0 )/blocks.14/self_attn/Constant_44_output_0'/blocks.14/self_attn/Gather_11_output_0/blocks.14/self_attn/Gather_11"Gather* axis y )/blocks.14/self_attn/Transpose_2_output_0&/blocks.14/self_attn/Shape_11_output_0/blocks.14/self_attn/Shape_11"Shape )/blocks.14/self_attn/Constant_45_output_0 /blocks.14/self_attn/Constant_45"Constant*F value*:B,/blocks.14/self_attn/Constant_45_attr::valueJ  &/blocks.14/self_attn/Shape_11_output_0 )/blocks.14/self_attn/Constant_45_output_0'/blocks.14/self_attn/Gather_12_output_0/blocks.14/self_attn/Gather_12"Gather* axis y )/blocks.14/self_attn/Transpose_2_output_0&/blocks.14/self_attn/Shape_12_output_0/blocks.14/self_attn/Shape_12"Shape )/blocks.14/self_attn/Constant_46_output_0 /blocks.14/self_attn/Constant_46"Constant*F value*:B,/blocks.14/self_attn/Constant_46_attr::valueJ  &/blocks.14/self_attn/Shape_12_output_0 )/blocks.14/self_attn/Constant_46_output_0'/blocks.14/self_attn/Gather_13_output_0/blocks.14/self_attn/Gather_13"Gather* axis )/blocks.14/self_attn/Constant_47_output_0 /blocks.14/self_attn/Constant_47"Constant*H value*<B,/blocks.14/self_attn/Constant_47_attr::valueJ  )/blocks.14/self_attn/Transpose_2_output_0 )/blocks.14/self_attn/Constant_47_output_0*/blocks.14/self_attn/Unsqueeze_21_output_0!/blocks.14/self_attn/Unsqueeze_21" Unsqueeze )/blocks.14/self_attn/Constant_48_output_0 /blocks.14/self_attn/Constant_48"Constant*H value*<B,/blocks.14/self_attn/Constant_48_attr::valueJ  '/blocks.14/self_attn/Gather_10_output_0 )/blocks.14/self_attn/Constant_48_output_0*/blocks.14/self_attn/Unsqueeze_22_output_0!/blocks.14/self_attn/Unsqueeze_22" Unsqueeze )/blocks.14/self_attn/Constant_49_output_0 /blocks.14/self_attn/Constant_49"Constant*H value*<B,/blocks.14/self_attn/Constant_49_attr::valueJ  '/blocks.14/self_attn/Gather_11_output_0 )/blocks.14/self_attn/Constant_49_output_0*/blocks.14/self_attn/Unsqueeze_23_output_0!/blocks.14/self_attn/Unsqueeze_23" Unsqueeze )/blocks.14/self_attn/Constant_50_output_0 /blocks.14/self_attn/Constant_50"Constant*H value*<B,/blocks.14/self_attn/Constant_50_attr::valueJ )/blocks.14/self_attn/Constant_51_output_0 /blocks.14/self_attn/Constant_51"Constant*H value*<B,/blocks.14/self_attn/Constant_51_attr::valueJ  '/blocks.14/self_attn/Gather_12_output_0 )/blocks.14/self_attn/Constant_51_output_0*/blocks.14/self_attn/Unsqueeze_24_output_0!/blocks.14/self_attn/Unsqueeze_24" Unsqueeze )/blocks.14/self_attn/Constant_52_output_0 /blocks.14/self_attn/Constant_52"Constant*H value*<B,/blocks.14/self_attn/Constant_52_attr::valueJ  '/blocks.14/self_attn/Gather_13_output_0 )/blocks.14/self_attn/Constant_52_output_0*/blocks.14/self_attn/Unsqueeze_25_output_0!/blocks.14/self_attn/Unsqueeze_25" Unsqueeze  */blocks.14/self_attn/Unsqueeze_22_output_0 */blocks.14/self_attn/Unsqueeze_23_output_0 )/blocks.14/self_attn/Constant_50_output_0 */blocks.14/self_attn/Unsqueeze_24_output_0 */blocks.14/self_attn/Unsqueeze_25_output_0'/blocks.14/self_attn/Concat_10_output_0/blocks.14/self_attn/Concat_10"Concat* axis )/blocks.14/self_attn/Constant_53_output_0 /blocks.14/self_attn/Constant_53"Constant*H value*<B,/blocks.14/self_attn/Constant_53_attr::valueJ  '/blocks.14/self_attn/Concat_10_output_0 )/blocks.14/self_attn/Constant_53_output_0'/blocks.14/self_attn/Reshape_5_output_0/blocks.14/self_attn/Reshape_5"Reshape* allowzero w '/blocks.14/self_attn/Reshape_5_output_0&/blocks.14/self_attn/Shape_13_output_0/blocks.14/self_attn/Shape_13"Shape  &/blocks.14/self_attn/Shape_13_output_0//blocks.14/self_attn/ConstantOfShape_1_output_0&/blocks.14/self_attn/ConstantOfShape_1"ConstantOfShape*N value*BB2/blocks.14/self_attn/ConstantOfShape_1_attr::valueJ )/blocks.14/self_attn/Constant_54_output_0 /blocks.14/self_attn/Constant_54"Constant*F value*:B,/blocks.14/self_attn/Constant_54_attr::valueJ  //blocks.14/self_attn/ConstantOfShape_1_output_0 )/blocks.14/self_attn/Constant_54_output_0#/blocks.14/self_attn/Mul_6_output_0/blocks.14/self_attn/Mul_6"Mul  '/blocks.14/self_attn/Reshape_5_output_0 #/blocks.14/self_attn/Mul_6_output_0%/blocks.14/self_attn/Equal_1_output_0/blocks.14/self_attn/Equal_1"Equal  %/blocks.14/self_attn/Equal_1_output_0 //blocks.14/self_attn/ConstantOfShape_1_output_0 '/blocks.14/self_attn/Reshape_5_output_0%/blocks.14/self_attn/Where_1_output_0/blocks.14/self_attn/Where_1"Where  */blocks.14/self_attn/Unsqueeze_21_output_0 %/blocks.14/self_attn/Where_1_output_0&/blocks.14/self_attn/Expand_1_output_0/blocks.14/self_attn/Expand_1"Expand )/blocks.14/self_attn/Constant_55_output_0 /blocks.14/self_attn/Constant_55"Constant*F value*:B,/blocks.14/self_attn/Constant_55_attr::valueJ  '/blocks.14/self_attn/Gather_11_output_0 )/blocks.14/self_attn/Constant_55_output_0#/blocks.14/self_attn/Mul_7_output_0/blocks.14/self_attn/Mul_7"Mul fonnx::Unsqueeze_4652 Constant_6422"Constant*5 value*)BConstant_6422_attr::valueJ  '/blocks.14/self_attn/Gather_10_output_0 onnx::Unsqueeze_4652*/blocks.14/self_attn/Unsqueeze_26_output_0!/blocks.14/self_attn/Unsqueeze_26" Unsqueeze fonnx::Unsqueeze_4654 Constant_6424"Constant*5 value*)BConstant_6424_attr::valueJ  #/blocks.14/self_attn/Mul_7_output_0 onnx::Unsqueeze_4654*/blocks.14/self_attn/Unsqueeze_27_output_0!/blocks.14/self_attn/Unsqueeze_27" Unsqueeze fonnx::Unsqueeze_4656 Constant_6426"Constant*5 value*)BConstant_6426_attr::valueJ  '/blocks.14/self_attn/Gather_12_output_0 onnx::Unsqueeze_4656*/blocks.14/self_attn/Unsqueeze_28_output_0!/blocks.14/self_attn/Unsqueeze_28" Unsqueeze fonnx::Unsqueeze_4658 Constant_6428"Constant*5 value*)BConstant_6428_attr::valueJ  '/blocks.14/self_attn/Gather_13_output_0 onnx::Unsqueeze_4658*/blocks.14/self_attn/Unsqueeze_29_output_0!/blocks.14/self_attn/Unsqueeze_29" Unsqueeze  */blocks.14/self_attn/Unsqueeze_26_output_0 */blocks.14/self_attn/Unsqueeze_27_output_0 */blocks.14/self_attn/Unsqueeze_28_output_0 */blocks.14/self_attn/Unsqueeze_29_output_0'/blocks.14/self_attn/Concat_11_output_0/blocks.14/self_attn/Concat_11"Concat* axis  &/blocks.14/self_attn/Expand_1_output_0 '/blocks.14/self_attn/Concat_11_output_0'/blocks.14/self_attn/Reshape_6_output_0/blocks.14/self_attn/Reshape_6"Reshape* allowzero  '/blocks.14/self_attn/Transpose_output_0 '/blocks.14/self_attn/Reshape_4_output_0$/blocks.14/self_attn/MatMul_output_0/blocks.14/self_attn/MatMul"MatMul )/blocks.14/self_attn/Constant_56_output_0 /blocks.14/self_attn/Constant_56"Constant*B value*6B,/blocks.14/self_attn/Constant_56_attr::valueJ5A  $/blocks.14/self_attn/MatMul_output_0 )/blocks.14/self_attn/Constant_56_output_0#/blocks.14/self_attn/Div_2_output_0/blocks.14/self_attn/Div_2"Div { #/blocks.14/self_attn/Div_2_output_0 attention_mask#/blocks.14/self_attn/Add_2_output_0/blocks.14/self_attn/Add_2"Add  #/blocks.14/self_attn/Add_2_output_0%/blocks.14/self_attn/Softmax_output_0/blocks.14/self_attn/Softmax"Softmax* axis { %/blocks.14/self_attn/Softmax_output_0$/blocks.14/self_attn/Cast_4_output_0/blocks.14/self_attn/Cast_4"Cast* to  $/blocks.14/self_attn/Cast_4_output_0 '/blocks.14/self_attn/Reshape_6_output_0&/blocks.14/self_attn/MatMul_1_output_0/blocks.14/self_attn/MatMul_1"MatMul  &/blocks.14/self_attn/MatMul_1_output_0)/blocks.14/self_attn/Transpose_3_output_0 /blocks.14/self_attn/Transpose_3" Transpose* perm@@@@ fonnx::Unsqueeze_4670 Constant_6440"Constant*5 value*)BConstant_6440_attr::valueJ  $/blocks.14/self_attn/Gather_output_0 onnx::Unsqueeze_4670*/blocks.14/self_attn/Unsqueeze_30_output_0!/blocks.14/self_attn/Unsqueeze_30" Unsqueeze fonnx::Unsqueeze_4672 Constant_6442"Constant*5 value*)BConstant_6442_attr::valueJ  &/blocks.14/self_attn/Gather_1_output_0 onnx::Unsqueeze_4672*/blocks.14/self_attn/Unsqueeze_31_output_0!/blocks.14/self_attn/Unsqueeze_31" Unsqueeze )/blocks.14/self_attn/Constant_57_output_0 /blocks.14/self_attn/Constant_57"Constant*H value*<B,/blocks.14/self_attn/Constant_57_attr::valueJ  */blocks.14/self_attn/Unsqueeze_30_output_0 */blocks.14/self_attn/Unsqueeze_31_output_0 )/blocks.14/self_attn/Constant_57_output_0'/blocks.14/self_attn/Concat_12_output_0/blocks.14/self_attn/Concat_12"Concat* axis  )/blocks.14/self_attn/Transpose_3_output_0 '/blocks.14/self_attn/Concat_12_output_0'/blocks.14/self_attn/Reshape_7_output_0/blocks.14/self_attn/Reshape_7"Reshape* allowzero  '/blocks.14/self_attn/Reshape_7_output_0 onnx::MatMul_8981+/blocks.14/self_attn/o_proj/MatMul_output_0"/blocks.14/self_attn/o_proj/MatMul"MatMul  */blocks.14/input_layernorm/Cast_1_output_0 +/blocks.14/self_attn/o_proj/MatMul_output_0/blocks.14/Add_output_0/blocks.14/Add"Add  /blocks.14/Add_output_01/blocks.14/post_attention_layernorm/Cast_output_0(/blocks.14/post_attention_layernorm/Cast"Cast* to 5/blocks.14/post_attention_layernorm/Constant_output_0,/blocks.14/post_attention_layernorm/Constant"Constant*N value*BB8/blocks.14/post_attention_layernorm/Constant_attr::valueJ@  1/blocks.14/post_attention_layernorm/Cast_output_0 5/blocks.14/post_attention_layernorm/Constant_output_00/blocks.14/post_attention_layernorm/Pow_output_0'/blocks.14/post_attention_layernorm/Pow"Pow  0/blocks.14/post_attention_layernorm/Pow_output_07/blocks.14/post_attention_layernorm/ReduceMean_output_0./blocks.14/post_attention_layernorm/ReduceMean" ReduceMean* axes@* keepdims 7/blocks.14/post_attention_layernorm/Constant_1_output_0./blocks.14/post_attention_layernorm/Constant_1"Constant*P value*DB:/blocks.14/post_attention_layernorm/Constant_1_attr::valueJ75  7/blocks.14/post_attention_layernorm/ReduceMean_output_0 7/blocks.14/post_attention_layernorm/Constant_1_output_00/blocks.14/post_attention_layernorm/Add_output_0'/blocks.14/post_attention_layernorm/Add"Add  0/blocks.14/post_attention_layernorm/Add_output_01/blocks.14/post_attention_layernorm/Sqrt_output_0(/blocks.14/post_attention_layernorm/Sqrt"Sqrt 7/blocks.14/post_attention_layernorm/Constant_2_output_0./blocks.14/post_attention_layernorm/Constant_2"Constant*P value*DB:/blocks.14/post_attention_layernorm/Constant_2_attr::valueJ?  7/blocks.14/post_attention_layernorm/Constant_2_output_0 1/blocks.14/post_attention_layernorm/Sqrt_output_00/blocks.14/post_attention_layernorm/Div_output_0'/blocks.14/post_attention_layernorm/Div"Div  1/blocks.14/post_attention_layernorm/Cast_output_03/blocks.14/post_attention_layernorm/Cast_1_output_0*/blocks.14/post_attention_layernorm/Cast_1"Cast* to  3/blocks.14/post_attention_layernorm/Cast_1_output_0 0/blocks.14/post_attention_layernorm/Div_output_00/blocks.14/post_attention_layernorm/Mul_output_0'/blocks.14/post_attention_layernorm/Mul"Mul  0/blocks.14/post_attention_layernorm/Mul_output_0 )blocks.14.post_attention_layernorm.weight2/blocks.14/post_attention_layernorm/Mul_1_output_0)/blocks.14/post_attention_layernorm/Mul_1"Mul  2/blocks.14/post_attention_layernorm/Mul_1_output_03/blocks.14/post_attention_layernorm/Cast_2_output_0*/blocks.14/post_attention_layernorm/Cast_2"Cast* to  3/blocks.14/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_8982(/blocks.14/mlp/gate_proj/MatMul_output_0/blocks.14/mlp/gate_proj/MatMul"MatMul z (/blocks.14/mlp/gate_proj/MatMul_output_0&/blocks.14/mlp/act_fn/Sigmoid_output_0/blocks.14/mlp/act_fn/Sigmoid"Sigmoid  (/blocks.14/mlp/gate_proj/MatMul_output_0 &/blocks.14/mlp/act_fn/Sigmoid_output_0"/blocks.14/mlp/act_fn/Mul_output_0/blocks.14/mlp/act_fn/Mul"Mul  3/blocks.14/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_8983&/blocks.14/mlp/up_proj/MatMul_output_0/blocks.14/mlp/up_proj/MatMul"MatMul  "/blocks.14/mlp/act_fn/Mul_output_0 &/blocks.14/mlp/up_proj/MatMul_output_0/blocks.14/mlp/Mul_output_0/blocks.14/mlp/Mul"Mul  /blocks.14/mlp/Mul_output_0 onnx::MatMul_8984(/blocks.14/mlp/down_proj/MatMul_output_0/blocks.14/mlp/down_proj/MatMul"MatMul  3/blocks.14/post_attention_layernorm/Cast_1_output_0 (/blocks.14/mlp/down_proj/MatMul_output_0/blocks.14/Add_1_output_0/blocks.14/Add_1"Add `/Constant_8_output_0 /Constant_8"Constant*1 value*%B/Constant_8_attr::valueJ ] past_key_values /Constant_8_output_0/Gather_15_output_0 /Gather_15"Gather* axis /blocks.15/Constant_output_0/blocks.15/Constant"Constant*K value*?B/blocks.15/Constant_attr::valueJ  /blocks.14/Add_1_output_0 /blocks.15/Constant_output_0/blocks.15/Reshape_output_0/blocks.15/Reshape"Reshape* allowzero y /blocks.15/Reshape_output_0(/blocks.15/input_layernorm/Cast_output_0/blocks.15/input_layernorm/Cast"Cast* to ,/blocks.15/input_layernorm/Constant_output_0#/blocks.15/input_layernorm/Constant"Constant*E value*9B//blocks.15/input_layernorm/Constant_attr::valueJ@  (/blocks.15/input_layernorm/Cast_output_0 ,/blocks.15/input_layernorm/Constant_output_0'/blocks.15/input_layernorm/Pow_output_0/blocks.15/input_layernorm/Pow"Pow  '/blocks.15/input_layernorm/Pow_output_0./blocks.15/input_layernorm/ReduceMean_output_0%/blocks.15/input_layernorm/ReduceMean" ReduceMean* axes@* keepdims ./blocks.15/input_layernorm/Constant_1_output_0%/blocks.15/input_layernorm/Constant_1"Constant*G value*;B1/blocks.15/input_layernorm/Constant_1_attr::valueJ75  ./blocks.15/input_layernorm/ReduceMean_output_0 ./blocks.15/input_layernorm/Constant_1_output_0'/blocks.15/input_layernorm/Add_output_0/blocks.15/input_layernorm/Add"Add z '/blocks.15/input_layernorm/Add_output_0(/blocks.15/input_layernorm/Sqrt_output_0/blocks.15/input_layernorm/Sqrt"Sqrt ./blocks.15/input_layernorm/Constant_2_output_0%/blocks.15/input_layernorm/Constant_2"Constant*G value*;B1/blocks.15/input_layernorm/Constant_2_attr::valueJ?  ./blocks.15/input_layernorm/Constant_2_output_0 (/blocks.15/input_layernorm/Sqrt_output_0'/blocks.15/input_layernorm/Div_output_0/blocks.15/input_layernorm/Div"Div  (/blocks.15/input_layernorm/Cast_output_0*/blocks.15/input_layernorm/Cast_1_output_0!/blocks.15/input_layernorm/Cast_1"Cast* to  */blocks.15/input_layernorm/Cast_1_output_0 '/blocks.15/input_layernorm/Div_output_0'/blocks.15/input_layernorm/Mul_output_0/blocks.15/input_layernorm/Mul"Mul  '/blocks.15/input_layernorm/Mul_output_0 blocks.15.input_layernorm.weight)/blocks.15/input_layernorm/Mul_1_output_0 /blocks.15/input_layernorm/Mul_1"Mul  )/blocks.15/input_layernorm/Mul_1_output_0*/blocks.15/input_layernorm/Cast_2_output_0!/blocks.15/input_layernorm/Cast_2"Cast* to t */blocks.15/input_layernorm/Cast_2_output_0#/blocks.15/self_attn/Shape_output_0/blocks.15/self_attn/Shape"Shape &/blocks.15/self_attn/Constant_output_0/blocks.15/self_attn/Constant"Constant*C value*7B)/blocks.15/self_attn/Constant_attr::valueJ  #/blocks.15/self_attn/Shape_output_0 &/blocks.15/self_attn/Constant_output_0$/blocks.15/self_attn/Gather_output_0/blocks.15/self_attn/Gather"Gather* axis x */blocks.15/input_layernorm/Cast_2_output_0%/blocks.15/self_attn/Shape_1_output_0/blocks.15/self_attn/Shape_1"Shape (/blocks.15/self_attn/Constant_1_output_0/blocks.15/self_attn/Constant_1"Constant*E value*9B+/blocks.15/self_attn/Constant_1_attr::valueJ  %/blocks.15/self_attn/Shape_1_output_0 (/blocks.15/self_attn/Constant_1_output_0&/blocks.15/self_attn/Gather_1_output_0/blocks.15/self_attn/Gather_1"Gather* axis  */blocks.15/input_layernorm/Cast_2_output_0 onnx::MatMul_8985+/blocks.15/self_attn/q_proj/MatMul_output_0"/blocks.15/self_attn/q_proj/MatMul"MatMul  */blocks.15/input_layernorm/Cast_2_output_0 onnx::MatMul_8986+/blocks.15/self_attn/k_proj/MatMul_output_0"/blocks.15/self_attn/k_proj/MatMul"MatMul  */blocks.15/input_layernorm/Cast_2_output_0 onnx::MatMul_8987+/blocks.15/self_attn/v_proj/MatMul_output_0"/blocks.15/self_attn/v_proj/MatMul"MatMul fonnx::Unsqueeze_4733 Constant_6495"Constant*5 value*)BConstant_6495_attr::valueJ  $/blocks.15/self_attn/Gather_output_0 onnx::Unsqueeze_4733'/blocks.15/self_attn/Unsqueeze_output_0/blocks.15/self_attn/Unsqueeze" Unsqueeze fonnx::Unsqueeze_4735 Constant_6497"Constant*5 value*)BConstant_6497_attr::valueJ  &/blocks.15/self_attn/Gather_1_output_0 onnx::Unsqueeze_4735)/blocks.15/self_attn/Unsqueeze_1_output_0 /blocks.15/self_attn/Unsqueeze_1" Unsqueeze (/blocks.15/self_attn/Constant_2_output_0/blocks.15/self_attn/Constant_2"Constant*G value*;B+/blocks.15/self_attn/Constant_2_attr::valueJ (/blocks.15/self_attn/Constant_3_output_0/blocks.15/self_attn/Constant_3"Constant*G value*;B+/blocks.15/self_attn/Constant_3_attr::valueJ  '/blocks.15/self_attn/Unsqueeze_output_0 )/blocks.15/self_attn/Unsqueeze_1_output_0 (/blocks.15/self_attn/Constant_2_output_0 (/blocks.15/self_attn/Constant_3_output_0$/blocks.15/self_attn/Concat_output_0/blocks.15/self_attn/Concat"Concat* axis  +/blocks.15/self_attn/q_proj/MatMul_output_0 $/blocks.15/self_attn/Concat_output_0%/blocks.15/self_attn/Reshape_output_0/blocks.15/self_attn/Reshape"Reshape* allowzero fonnx::Unsqueeze_4743 Constant_6503"Constant*5 value*)BConstant_6503_attr::valueJ  $/blocks.15/self_attn/Gather_output_0 onnx::Unsqueeze_4743)/blocks.15/self_attn/Unsqueeze_2_output_0 /blocks.15/self_attn/Unsqueeze_2" Unsqueeze fonnx::Unsqueeze_4745 Constant_6505"Constant*5 value*)BConstant_6505_attr::valueJ  &/blocks.15/self_attn/Gather_1_output_0 onnx::Unsqueeze_4745)/blocks.15/self_attn/Unsqueeze_3_output_0 /blocks.15/self_attn/Unsqueeze_3" Unsqueeze (/blocks.15/self_attn/Constant_4_output_0/blocks.15/self_attn/Constant_4"Constant*G value*;B+/blocks.15/self_attn/Constant_4_attr::valueJ (/blocks.15/self_attn/Constant_5_output_0/blocks.15/self_attn/Constant_5"Constant*G value*;B+/blocks.15/self_attn/Constant_5_attr::valueJ  )/blocks.15/self_attn/Unsqueeze_2_output_0 )/blocks.15/self_attn/Unsqueeze_3_output_0 (/blocks.15/self_attn/Constant_4_output_0 (/blocks.15/self_attn/Constant_5_output_0&/blocks.15/self_attn/Concat_1_output_0/blocks.15/self_attn/Concat_1"Concat* axis fonnx::Unsqueeze_4752 Constant_6510"Constant*5 value*)BConstant_6510_attr::valueJ  $/blocks.15/self_attn/Gather_output_0 onnx::Unsqueeze_4752)/blocks.15/self_attn/Unsqueeze_4_output_0 /blocks.15/self_attn/Unsqueeze_4" Unsqueeze fonnx::Unsqueeze_4754 Constant_6512"Constant*5 value*)BConstant_6512_attr::valueJ  &/blocks.15/self_attn/Gather_1_output_0 onnx::Unsqueeze_4754)/blocks.15/self_attn/Unsqueeze_5_output_0 /blocks.15/self_attn/Unsqueeze_5" Unsqueeze (/blocks.15/self_attn/Constant_6_output_0/blocks.15/self_attn/Constant_6"Constant*G value*;B+/blocks.15/self_attn/Constant_6_attr::valueJ (/blocks.15/self_attn/Constant_7_output_0/blocks.15/self_attn/Constant_7"Constant*G value*;B+/blocks.15/self_attn/Constant_7_attr::valueJ  )/blocks.15/self_attn/Unsqueeze_4_output_0 )/blocks.15/self_attn/Unsqueeze_5_output_0 (/blocks.15/self_attn/Constant_6_output_0 (/blocks.15/self_attn/Constant_7_output_0&/blocks.15/self_attn/Concat_2_output_0/blocks.15/self_attn/Concat_2"Concat* axis  +/blocks.15/self_attn/k_proj/MatMul_output_0 &/blocks.15/self_attn/Concat_1_output_0'/blocks.15/self_attn/Reshape_1_output_0/blocks.15/self_attn/Reshape_1"Reshape* allowzero  +/blocks.15/self_attn/v_proj/MatMul_output_0 &/blocks.15/self_attn/Concat_2_output_0'/blocks.15/self_attn/Reshape_2_output_0/blocks.15/self_attn/Reshape_2"Reshape* allowzero  %/blocks.15/self_attn/Reshape_output_0)/blocks.15/self_attn/q_norm/Cast_output_0 /blocks.15/self_attn/q_norm/Cast"Cast* to -/blocks.15/self_attn/q_norm/Constant_output_0$/blocks.15/self_attn/q_norm/Constant"Constant*F value*:B0/blocks.15/self_attn/q_norm/Constant_attr::valueJ@  )/blocks.15/self_attn/q_norm/Cast_output_0 -/blocks.15/self_attn/q_norm/Constant_output_0(/blocks.15/self_attn/q_norm/Pow_output_0/blocks.15/self_attn/q_norm/Pow"Pow  (/blocks.15/self_attn/q_norm/Pow_output_0//blocks.15/self_attn/q_norm/ReduceMean_output_0&/blocks.15/self_attn/q_norm/ReduceMean" ReduceMean* axes@* keepdims //blocks.15/self_attn/q_norm/Constant_1_output_0&/blocks.15/self_attn/q_norm/Constant_1"Constant*H value*<B2/blocks.15/self_attn/q_norm/Constant_1_attr::valueJ75  //blocks.15/self_attn/q_norm/ReduceMean_output_0 //blocks.15/self_attn/q_norm/Constant_1_output_0(/blocks.15/self_attn/q_norm/Add_output_0/blocks.15/self_attn/q_norm/Add"Add } (/blocks.15/self_attn/q_norm/Add_output_0)/blocks.15/self_attn/q_norm/Sqrt_output_0 /blocks.15/self_attn/q_norm/Sqrt"Sqrt //blocks.15/self_attn/q_norm/Constant_2_output_0&/blocks.15/self_attn/q_norm/Constant_2"Constant*H value*<B2/blocks.15/self_attn/q_norm/Constant_2_attr::valueJ?  //blocks.15/self_attn/q_norm/Constant_2_output_0 )/blocks.15/self_attn/q_norm/Sqrt_output_0(/blocks.15/self_attn/q_norm/Div_output_0/blocks.15/self_attn/q_norm/Div"Div  )/blocks.15/self_attn/q_norm/Cast_output_0+/blocks.15/self_attn/q_norm/Cast_1_output_0"/blocks.15/self_attn/q_norm/Cast_1"Cast* to  +/blocks.15/self_attn/q_norm/Cast_1_output_0 (/blocks.15/self_attn/q_norm/Div_output_0(/blocks.15/self_attn/q_norm/Mul_output_0/blocks.15/self_attn/q_norm/Mul"Mul  (/blocks.15/self_attn/q_norm/Mul_output_0 !blocks.15.self_attn.q_norm.weight*/blocks.15/self_attn/q_norm/Mul_1_output_0!/blocks.15/self_attn/q_norm/Mul_1"Mul  */blocks.15/self_attn/q_norm/Mul_1_output_0+/blocks.15/self_attn/q_norm/Cast_2_output_0"/blocks.15/self_attn/q_norm/Cast_2"Cast* to  '/blocks.15/self_attn/Reshape_1_output_0)/blocks.15/self_attn/k_norm/Cast_output_0 /blocks.15/self_attn/k_norm/Cast"Cast* to -/blocks.15/self_attn/k_norm/Constant_output_0$/blocks.15/self_attn/k_norm/Constant"Constant*F value*:B0/blocks.15/self_attn/k_norm/Constant_attr::valueJ@  )/blocks.15/self_attn/k_norm/Cast_output_0 -/blocks.15/self_attn/k_norm/Constant_output_0(/blocks.15/self_attn/k_norm/Pow_output_0/blocks.15/self_attn/k_norm/Pow"Pow  (/blocks.15/self_attn/k_norm/Pow_output_0//blocks.15/self_attn/k_norm/ReduceMean_output_0&/blocks.15/self_attn/k_norm/ReduceMean" ReduceMean* axes@* keepdims //blocks.15/self_attn/k_norm/Constant_1_output_0&/blocks.15/self_attn/k_norm/Constant_1"Constant*H value*<B2/blocks.15/self_attn/k_norm/Constant_1_attr::valueJ75  //blocks.15/self_attn/k_norm/ReduceMean_output_0 //blocks.15/self_attn/k_norm/Constant_1_output_0(/blocks.15/self_attn/k_norm/Add_output_0/blocks.15/self_attn/k_norm/Add"Add } (/blocks.15/self_attn/k_norm/Add_output_0)/blocks.15/self_attn/k_norm/Sqrt_output_0 /blocks.15/self_attn/k_norm/Sqrt"Sqrt //blocks.15/self_attn/k_norm/Constant_2_output_0&/blocks.15/self_attn/k_norm/Constant_2"Constant*H value*<B2/blocks.15/self_attn/k_norm/Constant_2_attr::valueJ?  //blocks.15/self_attn/k_norm/Constant_2_output_0 )/blocks.15/self_attn/k_norm/Sqrt_output_0(/blocks.15/self_attn/k_norm/Div_output_0/blocks.15/self_attn/k_norm/Div"Div  )/blocks.15/self_attn/k_norm/Cast_output_0+/blocks.15/self_attn/k_norm/Cast_1_output_0"/blocks.15/self_attn/k_norm/Cast_1"Cast* to  +/blocks.15/self_attn/k_norm/Cast_1_output_0 (/blocks.15/self_attn/k_norm/Div_output_0(/blocks.15/self_attn/k_norm/Mul_output_0/blocks.15/self_attn/k_norm/Mul"Mul  (/blocks.15/self_attn/k_norm/Mul_output_0 !blocks.15.self_attn.k_norm.weight*/blocks.15/self_attn/k_norm/Mul_1_output_0!/blocks.15/self_attn/k_norm/Mul_1"Mul  */blocks.15/self_attn/k_norm/Mul_1_output_0+/blocks.15/self_attn/k_norm/Cast_2_output_0"/blocks.15/self_attn/k_norm/Cast_2"Cast* to  +/blocks.15/self_attn/q_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0!/blocks.15/self_attn/Mul_output_0/blocks.15/self_attn/Mul"Mul y +/blocks.15/self_attn/q_norm/Cast_2_output_0%/blocks.15/self_attn/Shape_2_output_0/blocks.15/self_attn/Shape_2"Shape (/blocks.15/self_attn/Constant_8_output_0/blocks.15/self_attn/Constant_8"Constant*E value*9B+/blocks.15/self_attn/Constant_8_attr::valueJ  %/blocks.15/self_attn/Shape_2_output_0 (/blocks.15/self_attn/Constant_8_output_0&/blocks.15/self_attn/Gather_2_output_0/blocks.15/self_attn/Gather_2"Gather* axis (/blocks.15/self_attn/Constant_9_output_0/blocks.15/self_attn/Constant_9"Constant*E value*9B+/blocks.15/self_attn/Constant_9_attr::valueJ  &/blocks.15/self_attn/Gather_2_output_0 (/blocks.15/self_attn/Constant_9_output_0!/blocks.15/self_attn/Div_output_0/blocks.15/self_attn/Div"Div s !/blocks.15/self_attn/Div_output_0"/blocks.15/self_attn/Cast_output_0/blocks.15/self_attn/Cast"Cast* to x "/blocks.15/self_attn/Cast_output_0$/blocks.15/self_attn/Cast_1_output_0/blocks.15/self_attn/Cast_1"Cast* to )/blocks.15/self_attn/Constant_10_output_0 /blocks.15/self_attn/Constant_10"Constant*H value*<B,/blocks.15/self_attn/Constant_10_attr::valueJ )/blocks.15/self_attn/Constant_11_output_0 /blocks.15/self_attn/Constant_11"Constant*H value*<B,/blocks.15/self_attn/Constant_11_attr::valueJ )/blocks.15/self_attn/Constant_12_output_0 /blocks.15/self_attn/Constant_12"Constant*H value*<B,/blocks.15/self_attn/Constant_12_attr::valueJ  $/blocks.15/self_attn/Cast_1_output_0 )/blocks.15/self_attn/Constant_12_output_0)/blocks.15/self_attn/Unsqueeze_6_output_0 /blocks.15/self_attn/Unsqueeze_6" Unsqueeze )/blocks.15/self_attn/Constant_13_output_0 /blocks.15/self_attn/Constant_13"Constant*H value*<B,/blocks.15/self_attn/Constant_13_attr::valueJ  +/blocks.15/self_attn/q_norm/Cast_2_output_0 )/blocks.15/self_attn/Constant_11_output_0 )/blocks.15/self_attn/Unsqueeze_6_output_0 )/blocks.15/self_attn/Constant_10_output_0 )/blocks.15/self_attn/Constant_13_output_0#/blocks.15/self_attn/Slice_output_0/blocks.15/self_attn/Slice"Slice )/blocks.15/self_attn/Constant_14_output_0 /blocks.15/self_attn/Constant_14"Constant*H value*<B,/blocks.15/self_attn/Constant_14_attr::valueJ )/blocks.15/self_attn/Constant_15_output_0 /blocks.15/self_attn/Constant_15"Constant*H value*<B,/blocks.15/self_attn/Constant_15_attr::valueJ  $/blocks.15/self_attn/Cast_1_output_0 )/blocks.15/self_attn/Constant_15_output_0)/blocks.15/self_attn/Unsqueeze_7_output_0 /blocks.15/self_attn/Unsqueeze_7" Unsqueeze )/blocks.15/self_attn/Constant_16_output_0 /blocks.15/self_attn/Constant_16"Constant*H value*<B,/blocks.15/self_attn/Constant_16_attr::valueJ )/blocks.15/self_attn/Constant_17_output_0 /blocks.15/self_attn/Constant_17"Constant*H value*<B,/blocks.15/self_attn/Constant_17_attr::valueJ  +/blocks.15/self_attn/q_norm/Cast_2_output_0 )/blocks.15/self_attn/Unsqueeze_7_output_0 )/blocks.15/self_attn/Constant_16_output_0 )/blocks.15/self_attn/Constant_14_output_0 )/blocks.15/self_attn/Constant_17_output_0%/blocks.15/self_attn/Slice_1_output_0/blocks.15/self_attn/Slice_1"Slice i %/blocks.15/self_attn/Slice_1_output_0!/blocks.15/self_attn/Neg_output_0/blocks.15/self_attn/Neg"Neg  !/blocks.15/self_attn/Neg_output_0 #/blocks.15/self_attn/Slice_output_0&/blocks.15/self_attn/Concat_3_output_0/blocks.15/self_attn/Concat_3"Concat* axis  &/blocks.15/self_attn/Concat_3_output_0 %/blocks.0/self_attn/Gather_3_output_0#/blocks.15/self_attn/Mul_1_output_0/blocks.15/self_attn/Mul_1"Mul  !/blocks.15/self_attn/Mul_output_0 #/blocks.15/self_attn/Mul_1_output_0!/blocks.15/self_attn/Add_output_0/blocks.15/self_attn/Add"Add  +/blocks.15/self_attn/k_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0#/blocks.15/self_attn/Mul_2_output_0/blocks.15/self_attn/Mul_2"Mul y +/blocks.15/self_attn/k_norm/Cast_2_output_0%/blocks.15/self_attn/Shape_3_output_0/blocks.15/self_attn/Shape_3"Shape )/blocks.15/self_attn/Constant_18_output_0 /blocks.15/self_attn/Constant_18"Constant*F value*:B,/blocks.15/self_attn/Constant_18_attr::valueJ  %/blocks.15/self_attn/Shape_3_output_0 )/blocks.15/self_attn/Constant_18_output_0&/blocks.15/self_attn/Gather_3_output_0/blocks.15/self_attn/Gather_3"Gather* axis )/blocks.15/self_attn/Constant_19_output_0 /blocks.15/self_attn/Constant_19"Constant*F value*:B,/blocks.15/self_attn/Constant_19_attr::valueJ  &/blocks.15/self_attn/Gather_3_output_0 )/blocks.15/self_attn/Constant_19_output_0#/blocks.15/self_attn/Div_1_output_0/blocks.15/self_attn/Div_1"Div y #/blocks.15/self_attn/Div_1_output_0$/blocks.15/self_attn/Cast_2_output_0/blocks.15/self_attn/Cast_2"Cast* to z $/blocks.15/self_attn/Cast_2_output_0$/blocks.15/self_attn/Cast_3_output_0/blocks.15/self_attn/Cast_3"Cast* to )/blocks.15/self_attn/Constant_20_output_0 /blocks.15/self_attn/Constant_20"Constant*H value*<B,/blocks.15/self_attn/Constant_20_attr::valueJ )/blocks.15/self_attn/Constant_21_output_0 /blocks.15/self_attn/Constant_21"Constant*H value*<B,/blocks.15/self_attn/Constant_21_attr::valueJ )/blocks.15/self_attn/Constant_22_output_0 /blocks.15/self_attn/Constant_22"Constant*H value*<B,/blocks.15/self_attn/Constant_22_attr::valueJ  $/blocks.15/self_attn/Cast_3_output_0 )/blocks.15/self_attn/Constant_22_output_0)/blocks.15/self_attn/Unsqueeze_8_output_0 /blocks.15/self_attn/Unsqueeze_8" Unsqueeze )/blocks.15/self_attn/Constant_23_output_0 /blocks.15/self_attn/Constant_23"Constant*H value*<B,/blocks.15/self_attn/Constant_23_attr::valueJ  +/blocks.15/self_attn/k_norm/Cast_2_output_0 )/blocks.15/self_attn/Constant_21_output_0 )/blocks.15/self_attn/Unsqueeze_8_output_0 )/blocks.15/self_attn/Constant_20_output_0 )/blocks.15/self_attn/Constant_23_output_0%/blocks.15/self_attn/Slice_2_output_0/blocks.15/self_attn/Slice_2"Slice )/blocks.15/self_attn/Constant_24_output_0 /blocks.15/self_attn/Constant_24"Constant*H value*<B,/blocks.15/self_attn/Constant_24_attr::valueJ )/blocks.15/self_attn/Constant_25_output_0 /blocks.15/self_attn/Constant_25"Constant*H value*<B,/blocks.15/self_attn/Constant_25_attr::valueJ  $/blocks.15/self_attn/Cast_3_output_0 )/blocks.15/self_attn/Constant_25_output_0)/blocks.15/self_attn/Unsqueeze_9_output_0 /blocks.15/self_attn/Unsqueeze_9" Unsqueeze )/blocks.15/self_attn/Constant_26_output_0 /blocks.15/self_attn/Constant_26"Constant*H value*<B,/blocks.15/self_attn/Constant_26_attr::valueJ )/blocks.15/self_attn/Constant_27_output_0 /blocks.15/self_attn/Constant_27"Constant*H value*<B,/blocks.15/self_attn/Constant_27_attr::valueJ  +/blocks.15/self_attn/k_norm/Cast_2_output_0 )/blocks.15/self_attn/Unsqueeze_9_output_0 )/blocks.15/self_attn/Constant_26_output_0 )/blocks.15/self_attn/Constant_24_output_0 )/blocks.15/self_attn/Constant_27_output_0%/blocks.15/self_attn/Slice_3_output_0/blocks.15/self_attn/Slice_3"Slice m %/blocks.15/self_attn/Slice_3_output_0#/blocks.15/self_attn/Neg_1_output_0/blocks.15/self_attn/Neg_1"Neg  #/blocks.15/self_attn/Neg_1_output_0 %/blocks.15/self_attn/Slice_2_output_0&/blocks.15/self_attn/Concat_4_output_0/blocks.15/self_attn/Concat_4"Concat* axis  &/blocks.15/self_attn/Concat_4_output_0 %/blocks.0/self_attn/Gather_3_output_0#/blocks.15/self_attn/Mul_3_output_0/blocks.15/self_attn/Mul_3"Mul  #/blocks.15/self_attn/Mul_2_output_0 #/blocks.15/self_attn/Mul_3_output_0#/blocks.15/self_attn/Add_1_output_0/blocks.15/self_attn/Add_1"Add  /Gather_15_output_0 /rotary/Constant_3_output_0&/blocks.15/self_attn/Gather_4_output_0/blocks.15/self_attn/Gather_4"Gather* axis  /Gather_15_output_0 /rotary/Constant_8_output_0&/blocks.15/self_attn/Gather_5_output_0/blocks.15/self_attn/Gather_5"Gather* axis  &/blocks.15/self_attn/Gather_4_output_0 #/blocks.15/self_attn/Add_1_output_0&/blocks.15/self_attn/Concat_5_output_0/blocks.15/self_attn/Concat_5"Concat* axis  &/blocks.15/self_attn/Gather_5_output_0 '/blocks.15/self_attn/Reshape_2_output_0&/blocks.15/self_attn/Concat_6_output_0/blocks.15/self_attn/Concat_6"Concat* axis )/blocks.15/self_attn/Constant_28_output_0 /blocks.15/self_attn/Constant_28"Constant*H value*<B,/blocks.15/self_attn/Constant_28_attr::valueJ  &/blocks.15/self_attn/Concat_5_output_0 )/blocks.15/self_attn/Constant_28_output_0*/blocks.15/self_attn/Unsqueeze_10_output_0!/blocks.15/self_attn/Unsqueeze_10" Unsqueeze )/blocks.15/self_attn/Constant_29_output_0 /blocks.15/self_attn/Constant_29"Constant*H value*<B,/blocks.15/self_attn/Constant_29_attr::valueJ  &/blocks.15/self_attn/Concat_6_output_0 )/blocks.15/self_attn/Constant_29_output_0*/blocks.15/self_attn/Unsqueeze_11_output_0!/blocks.15/self_attn/Unsqueeze_11" Unsqueeze  */blocks.15/self_attn/Unsqueeze_10_output_0 */blocks.15/self_attn/Unsqueeze_11_output_0&/blocks.15/self_attn/Concat_7_output_0/blocks.15/self_attn/Concat_7"Concat* axis  !/blocks.15/self_attn/Add_output_0'/blocks.15/self_attn/Transpose_output_0/blocks.15/self_attn/Transpose" Transpose* perm@@@@  &/blocks.15/self_attn/Concat_5_output_0)/blocks.15/self_attn/Transpose_1_output_0 /blocks.15/self_attn/Transpose_1" Transpose* perm@@@@  &/blocks.15/self_attn/Concat_6_output_0)/blocks.15/self_attn/Transpose_2_output_0 /blocks.15/self_attn/Transpose_2" Transpose* perm@@@@ w )/blocks.15/self_attn/Transpose_1_output_0%/blocks.15/self_attn/Shape_4_output_0/blocks.15/self_attn/Shape_4"Shape )/blocks.15/self_attn/Constant_30_output_0 /blocks.15/self_attn/Constant_30"Constant*F value*:B,/blocks.15/self_attn/Constant_30_attr::valueJ  %/blocks.15/self_attn/Shape_4_output_0 )/blocks.15/self_attn/Constant_30_output_0&/blocks.15/self_attn/Gather_6_output_0/blocks.15/self_attn/Gather_6"Gather* axis w )/blocks.15/self_attn/Transpose_1_output_0%/blocks.15/self_attn/Shape_5_output_0/blocks.15/self_attn/Shape_5"Shape )/blocks.15/self_attn/Constant_31_output_0 /blocks.15/self_attn/Constant_31"Constant*F value*:B,/blocks.15/self_attn/Constant_31_attr::valueJ  %/blocks.15/self_attn/Shape_5_output_0 )/blocks.15/self_attn/Constant_31_output_0&/blocks.15/self_attn/Gather_7_output_0/blocks.15/self_attn/Gather_7"Gather* axis w )/blocks.15/self_attn/Transpose_1_output_0%/blocks.15/self_attn/Shape_6_output_0/blocks.15/self_attn/Shape_6"Shape )/blocks.15/self_attn/Constant_32_output_0 /blocks.15/self_attn/Constant_32"Constant*F value*:B,/blocks.15/self_attn/Constant_32_attr::valueJ  %/blocks.15/self_attn/Shape_6_output_0 )/blocks.15/self_attn/Constant_32_output_0&/blocks.15/self_attn/Gather_8_output_0/blocks.15/self_attn/Gather_8"Gather* axis w )/blocks.15/self_attn/Transpose_1_output_0%/blocks.15/self_attn/Shape_7_output_0/blocks.15/self_attn/Shape_7"Shape )/blocks.15/self_attn/Constant_33_output_0 /blocks.15/self_attn/Constant_33"Constant*F value*:B,/blocks.15/self_attn/Constant_33_attr::valueJ  %/blocks.15/self_attn/Shape_7_output_0 )/blocks.15/self_attn/Constant_33_output_0&/blocks.15/self_attn/Gather_9_output_0/blocks.15/self_attn/Gather_9"Gather* axis )/blocks.15/self_attn/Constant_34_output_0 /blocks.15/self_attn/Constant_34"Constant*H value*<B,/blocks.15/self_attn/Constant_34_attr::valueJ  )/blocks.15/self_attn/Transpose_1_output_0 )/blocks.15/self_attn/Constant_34_output_0*/blocks.15/self_attn/Unsqueeze_12_output_0!/blocks.15/self_attn/Unsqueeze_12" Unsqueeze )/blocks.15/self_attn/Constant_35_output_0 /blocks.15/self_attn/Constant_35"Constant*H value*<B,/blocks.15/self_attn/Constant_35_attr::valueJ  &/blocks.15/self_attn/Gather_6_output_0 )/blocks.15/self_attn/Constant_35_output_0*/blocks.15/self_attn/Unsqueeze_13_output_0!/blocks.15/self_attn/Unsqueeze_13" Unsqueeze )/blocks.15/self_attn/Constant_36_output_0 /blocks.15/self_attn/Constant_36"Constant*H value*<B,/blocks.15/self_attn/Constant_36_attr::valueJ  &/blocks.15/self_attn/Gather_7_output_0 )/blocks.15/self_attn/Constant_36_output_0*/blocks.15/self_attn/Unsqueeze_14_output_0!/blocks.15/self_attn/Unsqueeze_14" Unsqueeze )/blocks.15/self_attn/Constant_37_output_0 /blocks.15/self_attn/Constant_37"Constant*H value*<B,/blocks.15/self_attn/Constant_37_attr::valueJ )/blocks.15/self_attn/Constant_38_output_0 /blocks.15/self_attn/Constant_38"Constant*H value*<B,/blocks.15/self_attn/Constant_38_attr::valueJ  &/blocks.15/self_attn/Gather_8_output_0 )/blocks.15/self_attn/Constant_38_output_0*/blocks.15/self_attn/Unsqueeze_15_output_0!/blocks.15/self_attn/Unsqueeze_15" Unsqueeze )/blocks.15/self_attn/Constant_39_output_0 /blocks.15/self_attn/Constant_39"Constant*H value*<B,/blocks.15/self_attn/Constant_39_attr::valueJ  &/blocks.15/self_attn/Gather_9_output_0 )/blocks.15/self_attn/Constant_39_output_0*/blocks.15/self_attn/Unsqueeze_16_output_0!/blocks.15/self_attn/Unsqueeze_16" Unsqueeze  */blocks.15/self_attn/Unsqueeze_13_output_0 */blocks.15/self_attn/Unsqueeze_14_output_0 )/blocks.15/self_attn/Constant_37_output_0 */blocks.15/self_attn/Unsqueeze_15_output_0 */blocks.15/self_attn/Unsqueeze_16_output_0&/blocks.15/self_attn/Concat_8_output_0/blocks.15/self_attn/Concat_8"Concat* axis )/blocks.15/self_attn/Constant_40_output_0 /blocks.15/self_attn/Constant_40"Constant*H value*<B,/blocks.15/self_attn/Constant_40_attr::valueJ  &/blocks.15/self_attn/Concat_8_output_0 )/blocks.15/self_attn/Constant_40_output_0'/blocks.15/self_attn/Reshape_3_output_0/blocks.15/self_attn/Reshape_3"Reshape* allowzero u '/blocks.15/self_attn/Reshape_3_output_0%/blocks.15/self_attn/Shape_8_output_0/blocks.15/self_attn/Shape_8"Shape  %/blocks.15/self_attn/Shape_8_output_0-/blocks.15/self_attn/ConstantOfShape_output_0$/blocks.15/self_attn/ConstantOfShape"ConstantOfShape*L value*@B0/blocks.15/self_attn/ConstantOfShape_attr::valueJ )/blocks.15/self_attn/Constant_41_output_0 /blocks.15/self_attn/Constant_41"Constant*F value*:B,/blocks.15/self_attn/Constant_41_attr::valueJ  -/blocks.15/self_attn/ConstantOfShape_output_0 )/blocks.15/self_attn/Constant_41_output_0#/blocks.15/self_attn/Mul_4_output_0/blocks.15/self_attn/Mul_4"Mul  '/blocks.15/self_attn/Reshape_3_output_0 #/blocks.15/self_attn/Mul_4_output_0#/blocks.15/self_attn/Equal_output_0/blocks.15/self_attn/Equal"Equal  #/blocks.15/self_attn/Equal_output_0 -/blocks.15/self_attn/ConstantOfShape_output_0 '/blocks.15/self_attn/Reshape_3_output_0#/blocks.15/self_attn/Where_output_0/blocks.15/self_attn/Where"Where  */blocks.15/self_attn/Unsqueeze_12_output_0 #/blocks.15/self_attn/Where_output_0$/blocks.15/self_attn/Expand_output_0/blocks.15/self_attn/Expand"Expand )/blocks.15/self_attn/Constant_42_output_0 /blocks.15/self_attn/Constant_42"Constant*F value*:B,/blocks.15/self_attn/Constant_42_attr::valueJ  &/blocks.15/self_attn/Gather_7_output_0 )/blocks.15/self_attn/Constant_42_output_0#/blocks.15/self_attn/Mul_5_output_0/blocks.15/self_attn/Mul_5"Mul fonnx::Unsqueeze_4897 Constant_6640"Constant*5 value*)BConstant_6640_attr::valueJ  &/blocks.15/self_attn/Gather_6_output_0 onnx::Unsqueeze_4897*/blocks.15/self_attn/Unsqueeze_17_output_0!/blocks.15/self_attn/Unsqueeze_17" Unsqueeze fonnx::Unsqueeze_4899 Constant_6642"Constant*5 value*)BConstant_6642_attr::valueJ  #/blocks.15/self_attn/Mul_5_output_0 onnx::Unsqueeze_4899*/blocks.15/self_attn/Unsqueeze_18_output_0!/blocks.15/self_attn/Unsqueeze_18" Unsqueeze fonnx::Unsqueeze_4901 Constant_6644"Constant*5 value*)BConstant_6644_attr::valueJ  &/blocks.15/self_attn/Gather_8_output_0 onnx::Unsqueeze_4901*/blocks.15/self_attn/Unsqueeze_19_output_0!/blocks.15/self_attn/Unsqueeze_19" Unsqueeze fonnx::Unsqueeze_4903 Constant_6646"Constant*5 value*)BConstant_6646_attr::valueJ  &/blocks.15/self_attn/Gather_9_output_0 onnx::Unsqueeze_4903*/blocks.15/self_attn/Unsqueeze_20_output_0!/blocks.15/self_attn/Unsqueeze_20" Unsqueeze  */blocks.15/self_attn/Unsqueeze_17_output_0 */blocks.15/self_attn/Unsqueeze_18_output_0 */blocks.15/self_attn/Unsqueeze_19_output_0 */blocks.15/self_attn/Unsqueeze_20_output_0&/blocks.15/self_attn/Concat_9_output_0/blocks.15/self_attn/Concat_9"Concat* axis  $/blocks.15/self_attn/Expand_output_0 &/blocks.15/self_attn/Concat_9_output_0'/blocks.15/self_attn/Reshape_4_output_0/blocks.15/self_attn/Reshape_4"Reshape* allowzero w )/blocks.15/self_attn/Transpose_2_output_0%/blocks.15/self_attn/Shape_9_output_0/blocks.15/self_attn/Shape_9"Shape )/blocks.15/self_attn/Constant_43_output_0 /blocks.15/self_attn/Constant_43"Constant*F value*:B,/blocks.15/self_attn/Constant_43_attr::valueJ  %/blocks.15/self_attn/Shape_9_output_0 )/blocks.15/self_attn/Constant_43_output_0'/blocks.15/self_attn/Gather_10_output_0/blocks.15/self_attn/Gather_10"Gather* axis y )/blocks.15/self_attn/Transpose_2_output_0&/blocks.15/self_attn/Shape_10_output_0/blocks.15/self_attn/Shape_10"Shape )/blocks.15/self_attn/Constant_44_output_0 /blocks.15/self_attn/Constant_44"Constant*F value*:B,/blocks.15/self_attn/Constant_44_attr::valueJ  &/blocks.15/self_attn/Shape_10_output_0 )/blocks.15/self_attn/Constant_44_output_0'/blocks.15/self_attn/Gather_11_output_0/blocks.15/self_attn/Gather_11"Gather* axis y )/blocks.15/self_attn/Transpose_2_output_0&/blocks.15/self_attn/Shape_11_output_0/blocks.15/self_attn/Shape_11"Shape )/blocks.15/self_attn/Constant_45_output_0 /blocks.15/self_attn/Constant_45"Constant*F value*:B,/blocks.15/self_attn/Constant_45_attr::valueJ  &/blocks.15/self_attn/Shape_11_output_0 )/blocks.15/self_attn/Constant_45_output_0'/blocks.15/self_attn/Gather_12_output_0/blocks.15/self_attn/Gather_12"Gather* axis y )/blocks.15/self_attn/Transpose_2_output_0&/blocks.15/self_attn/Shape_12_output_0/blocks.15/self_attn/Shape_12"Shape )/blocks.15/self_attn/Constant_46_output_0 /blocks.15/self_attn/Constant_46"Constant*F value*:B,/blocks.15/self_attn/Constant_46_attr::valueJ  &/blocks.15/self_attn/Shape_12_output_0 )/blocks.15/self_attn/Constant_46_output_0'/blocks.15/self_attn/Gather_13_output_0/blocks.15/self_attn/Gather_13"Gather* axis )/blocks.15/self_attn/Constant_47_output_0 /blocks.15/self_attn/Constant_47"Constant*H value*<B,/blocks.15/self_attn/Constant_47_attr::valueJ  )/blocks.15/self_attn/Transpose_2_output_0 )/blocks.15/self_attn/Constant_47_output_0*/blocks.15/self_attn/Unsqueeze_21_output_0!/blocks.15/self_attn/Unsqueeze_21" Unsqueeze )/blocks.15/self_attn/Constant_48_output_0 /blocks.15/self_attn/Constant_48"Constant*H value*<B,/blocks.15/self_attn/Constant_48_attr::valueJ  '/blocks.15/self_attn/Gather_10_output_0 )/blocks.15/self_attn/Constant_48_output_0*/blocks.15/self_attn/Unsqueeze_22_output_0!/blocks.15/self_attn/Unsqueeze_22" Unsqueeze )/blocks.15/self_attn/Constant_49_output_0 /blocks.15/self_attn/Constant_49"Constant*H value*<B,/blocks.15/self_attn/Constant_49_attr::valueJ  '/blocks.15/self_attn/Gather_11_output_0 )/blocks.15/self_attn/Constant_49_output_0*/blocks.15/self_attn/Unsqueeze_23_output_0!/blocks.15/self_attn/Unsqueeze_23" Unsqueeze )/blocks.15/self_attn/Constant_50_output_0 /blocks.15/self_attn/Constant_50"Constant*H value*<B,/blocks.15/self_attn/Constant_50_attr::valueJ )/blocks.15/self_attn/Constant_51_output_0 /blocks.15/self_attn/Constant_51"Constant*H value*<B,/blocks.15/self_attn/Constant_51_attr::valueJ  '/blocks.15/self_attn/Gather_12_output_0 )/blocks.15/self_attn/Constant_51_output_0*/blocks.15/self_attn/Unsqueeze_24_output_0!/blocks.15/self_attn/Unsqueeze_24" Unsqueeze )/blocks.15/self_attn/Constant_52_output_0 /blocks.15/self_attn/Constant_52"Constant*H value*<B,/blocks.15/self_attn/Constant_52_attr::valueJ  '/blocks.15/self_attn/Gather_13_output_0 )/blocks.15/self_attn/Constant_52_output_0*/blocks.15/self_attn/Unsqueeze_25_output_0!/blocks.15/self_attn/Unsqueeze_25" Unsqueeze  */blocks.15/self_attn/Unsqueeze_22_output_0 */blocks.15/self_attn/Unsqueeze_23_output_0 )/blocks.15/self_attn/Constant_50_output_0 */blocks.15/self_attn/Unsqueeze_24_output_0 */blocks.15/self_attn/Unsqueeze_25_output_0'/blocks.15/self_attn/Concat_10_output_0/blocks.15/self_attn/Concat_10"Concat* axis )/blocks.15/self_attn/Constant_53_output_0 /blocks.15/self_attn/Constant_53"Constant*H value*<B,/blocks.15/self_attn/Constant_53_attr::valueJ  '/blocks.15/self_attn/Concat_10_output_0 )/blocks.15/self_attn/Constant_53_output_0'/blocks.15/self_attn/Reshape_5_output_0/blocks.15/self_attn/Reshape_5"Reshape* allowzero w '/blocks.15/self_attn/Reshape_5_output_0&/blocks.15/self_attn/Shape_13_output_0/blocks.15/self_attn/Shape_13"Shape  &/blocks.15/self_attn/Shape_13_output_0//blocks.15/self_attn/ConstantOfShape_1_output_0&/blocks.15/self_attn/ConstantOfShape_1"ConstantOfShape*N value*BB2/blocks.15/self_attn/ConstantOfShape_1_attr::valueJ )/blocks.15/self_attn/Constant_54_output_0 /blocks.15/self_attn/Constant_54"Constant*F value*:B,/blocks.15/self_attn/Constant_54_attr::valueJ  //blocks.15/self_attn/ConstantOfShape_1_output_0 )/blocks.15/self_attn/Constant_54_output_0#/blocks.15/self_attn/Mul_6_output_0/blocks.15/self_attn/Mul_6"Mul  '/blocks.15/self_attn/Reshape_5_output_0 #/blocks.15/self_attn/Mul_6_output_0%/blocks.15/self_attn/Equal_1_output_0/blocks.15/self_attn/Equal_1"Equal  %/blocks.15/self_attn/Equal_1_output_0 //blocks.15/self_attn/ConstantOfShape_1_output_0 '/blocks.15/self_attn/Reshape_5_output_0%/blocks.15/self_attn/Where_1_output_0/blocks.15/self_attn/Where_1"Where  */blocks.15/self_attn/Unsqueeze_21_output_0 %/blocks.15/self_attn/Where_1_output_0&/blocks.15/self_attn/Expand_1_output_0/blocks.15/self_attn/Expand_1"Expand )/blocks.15/self_attn/Constant_55_output_0 /blocks.15/self_attn/Constant_55"Constant*F value*:B,/blocks.15/self_attn/Constant_55_attr::valueJ  '/blocks.15/self_attn/Gather_11_output_0 )/blocks.15/self_attn/Constant_55_output_0#/blocks.15/self_attn/Mul_7_output_0/blocks.15/self_attn/Mul_7"Mul fonnx::Unsqueeze_4943 Constant_6685"Constant*5 value*)BConstant_6685_attr::valueJ  '/blocks.15/self_attn/Gather_10_output_0 onnx::Unsqueeze_4943*/blocks.15/self_attn/Unsqueeze_26_output_0!/blocks.15/self_attn/Unsqueeze_26" Unsqueeze fonnx::Unsqueeze_4945 Constant_6687"Constant*5 value*)BConstant_6687_attr::valueJ  #/blocks.15/self_attn/Mul_7_output_0 onnx::Unsqueeze_4945*/blocks.15/self_attn/Unsqueeze_27_output_0!/blocks.15/self_attn/Unsqueeze_27" Unsqueeze fonnx::Unsqueeze_4947 Constant_6689"Constant*5 value*)BConstant_6689_attr::valueJ  '/blocks.15/self_attn/Gather_12_output_0 onnx::Unsqueeze_4947*/blocks.15/self_attn/Unsqueeze_28_output_0!/blocks.15/self_attn/Unsqueeze_28" Unsqueeze fonnx::Unsqueeze_4949 Constant_6691"Constant*5 value*)BConstant_6691_attr::valueJ  '/blocks.15/self_attn/Gather_13_output_0 onnx::Unsqueeze_4949*/blocks.15/self_attn/Unsqueeze_29_output_0!/blocks.15/self_attn/Unsqueeze_29" Unsqueeze  */blocks.15/self_attn/Unsqueeze_26_output_0 */blocks.15/self_attn/Unsqueeze_27_output_0 */blocks.15/self_attn/Unsqueeze_28_output_0 */blocks.15/self_attn/Unsqueeze_29_output_0'/blocks.15/self_attn/Concat_11_output_0/blocks.15/self_attn/Concat_11"Concat* axis  &/blocks.15/self_attn/Expand_1_output_0 '/blocks.15/self_attn/Concat_11_output_0'/blocks.15/self_attn/Reshape_6_output_0/blocks.15/self_attn/Reshape_6"Reshape* allowzero  '/blocks.15/self_attn/Transpose_output_0 '/blocks.15/self_attn/Reshape_4_output_0$/blocks.15/self_attn/MatMul_output_0/blocks.15/self_attn/MatMul"MatMul )/blocks.15/self_attn/Constant_56_output_0 /blocks.15/self_attn/Constant_56"Constant*B value*6B,/blocks.15/self_attn/Constant_56_attr::valueJ5A  $/blocks.15/self_attn/MatMul_output_0 )/blocks.15/self_attn/Constant_56_output_0#/blocks.15/self_attn/Div_2_output_0/blocks.15/self_attn/Div_2"Div { #/blocks.15/self_attn/Div_2_output_0 attention_mask#/blocks.15/self_attn/Add_2_output_0/blocks.15/self_attn/Add_2"Add  #/blocks.15/self_attn/Add_2_output_0%/blocks.15/self_attn/Softmax_output_0/blocks.15/self_attn/Softmax"Softmax* axis { %/blocks.15/self_attn/Softmax_output_0$/blocks.15/self_attn/Cast_4_output_0/blocks.15/self_attn/Cast_4"Cast* to  $/blocks.15/self_attn/Cast_4_output_0 '/blocks.15/self_attn/Reshape_6_output_0&/blocks.15/self_attn/MatMul_1_output_0/blocks.15/self_attn/MatMul_1"MatMul  &/blocks.15/self_attn/MatMul_1_output_0)/blocks.15/self_attn/Transpose_3_output_0 /blocks.15/self_attn/Transpose_3" Transpose* perm@@@@ fonnx::Unsqueeze_4961 Constant_6703"Constant*5 value*)BConstant_6703_attr::valueJ  $/blocks.15/self_attn/Gather_output_0 onnx::Unsqueeze_4961*/blocks.15/self_attn/Unsqueeze_30_output_0!/blocks.15/self_attn/Unsqueeze_30" Unsqueeze fonnx::Unsqueeze_4963 Constant_6705"Constant*5 value*)BConstant_6705_attr::valueJ  &/blocks.15/self_attn/Gather_1_output_0 onnx::Unsqueeze_4963*/blocks.15/self_attn/Unsqueeze_31_output_0!/blocks.15/self_attn/Unsqueeze_31" Unsqueeze )/blocks.15/self_attn/Constant_57_output_0 /blocks.15/self_attn/Constant_57"Constant*H value*<B,/blocks.15/self_attn/Constant_57_attr::valueJ  */blocks.15/self_attn/Unsqueeze_30_output_0 */blocks.15/self_attn/Unsqueeze_31_output_0 )/blocks.15/self_attn/Constant_57_output_0'/blocks.15/self_attn/Concat_12_output_0/blocks.15/self_attn/Concat_12"Concat* axis  )/blocks.15/self_attn/Transpose_3_output_0 '/blocks.15/self_attn/Concat_12_output_0'/blocks.15/self_attn/Reshape_7_output_0/blocks.15/self_attn/Reshape_7"Reshape* allowzero  '/blocks.15/self_attn/Reshape_7_output_0 onnx::MatMul_9009+/blocks.15/self_attn/o_proj/MatMul_output_0"/blocks.15/self_attn/o_proj/MatMul"MatMul  */blocks.15/input_layernorm/Cast_1_output_0 +/blocks.15/self_attn/o_proj/MatMul_output_0/blocks.15/Add_output_0/blocks.15/Add"Add  /blocks.15/Add_output_01/blocks.15/post_attention_layernorm/Cast_output_0(/blocks.15/post_attention_layernorm/Cast"Cast* to 5/blocks.15/post_attention_layernorm/Constant_output_0,/blocks.15/post_attention_layernorm/Constant"Constant*N value*BB8/blocks.15/post_attention_layernorm/Constant_attr::valueJ@  1/blocks.15/post_attention_layernorm/Cast_output_0 5/blocks.15/post_attention_layernorm/Constant_output_00/blocks.15/post_attention_layernorm/Pow_output_0'/blocks.15/post_attention_layernorm/Pow"Pow  0/blocks.15/post_attention_layernorm/Pow_output_07/blocks.15/post_attention_layernorm/ReduceMean_output_0./blocks.15/post_attention_layernorm/ReduceMean" ReduceMean* axes@* keepdims 7/blocks.15/post_attention_layernorm/Constant_1_output_0./blocks.15/post_attention_layernorm/Constant_1"Constant*P value*DB:/blocks.15/post_attention_layernorm/Constant_1_attr::valueJ75  7/blocks.15/post_attention_layernorm/ReduceMean_output_0 7/blocks.15/post_attention_layernorm/Constant_1_output_00/blocks.15/post_attention_layernorm/Add_output_0'/blocks.15/post_attention_layernorm/Add"Add  0/blocks.15/post_attention_layernorm/Add_output_01/blocks.15/post_attention_layernorm/Sqrt_output_0(/blocks.15/post_attention_layernorm/Sqrt"Sqrt 7/blocks.15/post_attention_layernorm/Constant_2_output_0./blocks.15/post_attention_layernorm/Constant_2"Constant*P value*DB:/blocks.15/post_attention_layernorm/Constant_2_attr::valueJ?  7/blocks.15/post_attention_layernorm/Constant_2_output_0 1/blocks.15/post_attention_layernorm/Sqrt_output_00/blocks.15/post_attention_layernorm/Div_output_0'/blocks.15/post_attention_layernorm/Div"Div  1/blocks.15/post_attention_layernorm/Cast_output_03/blocks.15/post_attention_layernorm/Cast_1_output_0*/blocks.15/post_attention_layernorm/Cast_1"Cast* to  3/blocks.15/post_attention_layernorm/Cast_1_output_0 0/blocks.15/post_attention_layernorm/Div_output_00/blocks.15/post_attention_layernorm/Mul_output_0'/blocks.15/post_attention_layernorm/Mul"Mul  0/blocks.15/post_attention_layernorm/Mul_output_0 )blocks.15.post_attention_layernorm.weight2/blocks.15/post_attention_layernorm/Mul_1_output_0)/blocks.15/post_attention_layernorm/Mul_1"Mul  2/blocks.15/post_attention_layernorm/Mul_1_output_03/blocks.15/post_attention_layernorm/Cast_2_output_0*/blocks.15/post_attention_layernorm/Cast_2"Cast* to  3/blocks.15/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_9010(/blocks.15/mlp/gate_proj/MatMul_output_0/blocks.15/mlp/gate_proj/MatMul"MatMul z (/blocks.15/mlp/gate_proj/MatMul_output_0&/blocks.15/mlp/act_fn/Sigmoid_output_0/blocks.15/mlp/act_fn/Sigmoid"Sigmoid  (/blocks.15/mlp/gate_proj/MatMul_output_0 &/blocks.15/mlp/act_fn/Sigmoid_output_0"/blocks.15/mlp/act_fn/Mul_output_0/blocks.15/mlp/act_fn/Mul"Mul  3/blocks.15/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_9011&/blocks.15/mlp/up_proj/MatMul_output_0/blocks.15/mlp/up_proj/MatMul"MatMul  "/blocks.15/mlp/act_fn/Mul_output_0 &/blocks.15/mlp/up_proj/MatMul_output_0/blocks.15/mlp/Mul_output_0/blocks.15/mlp/Mul"Mul  /blocks.15/mlp/Mul_output_0 onnx::MatMul_9012(/blocks.15/mlp/down_proj/MatMul_output_0/blocks.15/mlp/down_proj/MatMul"MatMul  3/blocks.15/post_attention_layernorm/Cast_1_output_0 (/blocks.15/mlp/down_proj/MatMul_output_0/blocks.15/Add_1_output_0/blocks.15/Add_1"Add p past_key_values '/blocks.0/self_attn/Constant_2_output_0/Gather_16_output_0 /Gather_16"Gather* axis /blocks.16/Constant_output_0/blocks.16/Constant"Constant*K value*?B/blocks.16/Constant_attr::valueJ  /blocks.15/Add_1_output_0 /blocks.16/Constant_output_0/blocks.16/Reshape_output_0/blocks.16/Reshape"Reshape* allowzero y /blocks.16/Reshape_output_0(/blocks.16/input_layernorm/Cast_output_0/blocks.16/input_layernorm/Cast"Cast* to ,/blocks.16/input_layernorm/Constant_output_0#/blocks.16/input_layernorm/Constant"Constant*E value*9B//blocks.16/input_layernorm/Constant_attr::valueJ@  (/blocks.16/input_layernorm/Cast_output_0 ,/blocks.16/input_layernorm/Constant_output_0'/blocks.16/input_layernorm/Pow_output_0/blocks.16/input_layernorm/Pow"Pow  '/blocks.16/input_layernorm/Pow_output_0./blocks.16/input_layernorm/ReduceMean_output_0%/blocks.16/input_layernorm/ReduceMean" ReduceMean* axes@* keepdims ./blocks.16/input_layernorm/Constant_1_output_0%/blocks.16/input_layernorm/Constant_1"Constant*G value*;B1/blocks.16/input_layernorm/Constant_1_attr::valueJ75  ./blocks.16/input_layernorm/ReduceMean_output_0 ./blocks.16/input_layernorm/Constant_1_output_0'/blocks.16/input_layernorm/Add_output_0/blocks.16/input_layernorm/Add"Add z '/blocks.16/input_layernorm/Add_output_0(/blocks.16/input_layernorm/Sqrt_output_0/blocks.16/input_layernorm/Sqrt"Sqrt ./blocks.16/input_layernorm/Constant_2_output_0%/blocks.16/input_layernorm/Constant_2"Constant*G value*;B1/blocks.16/input_layernorm/Constant_2_attr::valueJ?  ./blocks.16/input_layernorm/Constant_2_output_0 (/blocks.16/input_layernorm/Sqrt_output_0'/blocks.16/input_layernorm/Div_output_0/blocks.16/input_layernorm/Div"Div  (/blocks.16/input_layernorm/Cast_output_0*/blocks.16/input_layernorm/Cast_1_output_0!/blocks.16/input_layernorm/Cast_1"Cast* to  */blocks.16/input_layernorm/Cast_1_output_0 '/blocks.16/input_layernorm/Div_output_0'/blocks.16/input_layernorm/Mul_output_0/blocks.16/input_layernorm/Mul"Mul  '/blocks.16/input_layernorm/Mul_output_0 blocks.16.input_layernorm.weight)/blocks.16/input_layernorm/Mul_1_output_0 /blocks.16/input_layernorm/Mul_1"Mul  )/blocks.16/input_layernorm/Mul_1_output_0*/blocks.16/input_layernorm/Cast_2_output_0!/blocks.16/input_layernorm/Cast_2"Cast* to t */blocks.16/input_layernorm/Cast_2_output_0#/blocks.16/self_attn/Shape_output_0/blocks.16/self_attn/Shape"Shape &/blocks.16/self_attn/Constant_output_0/blocks.16/self_attn/Constant"Constant*C value*7B)/blocks.16/self_attn/Constant_attr::valueJ  #/blocks.16/self_attn/Shape_output_0 &/blocks.16/self_attn/Constant_output_0$/blocks.16/self_attn/Gather_output_0/blocks.16/self_attn/Gather"Gather* axis x */blocks.16/input_layernorm/Cast_2_output_0%/blocks.16/self_attn/Shape_1_output_0/blocks.16/self_attn/Shape_1"Shape (/blocks.16/self_attn/Constant_1_output_0/blocks.16/self_attn/Constant_1"Constant*E value*9B+/blocks.16/self_attn/Constant_1_attr::valueJ  %/blocks.16/self_attn/Shape_1_output_0 (/blocks.16/self_attn/Constant_1_output_0&/blocks.16/self_attn/Gather_1_output_0/blocks.16/self_attn/Gather_1"Gather* axis  */blocks.16/input_layernorm/Cast_2_output_0 onnx::MatMul_9013+/blocks.16/self_attn/q_proj/MatMul_output_0"/blocks.16/self_attn/q_proj/MatMul"MatMul  */blocks.16/input_layernorm/Cast_2_output_0 onnx::MatMul_9014+/blocks.16/self_attn/k_proj/MatMul_output_0"/blocks.16/self_attn/k_proj/MatMul"MatMul  */blocks.16/input_layernorm/Cast_2_output_0 onnx::MatMul_9015+/blocks.16/self_attn/v_proj/MatMul_output_0"/blocks.16/self_attn/v_proj/MatMul"MatMul fonnx::Unsqueeze_5023 Constant_6757"Constant*5 value*)BConstant_6757_attr::valueJ  $/blocks.16/self_attn/Gather_output_0 onnx::Unsqueeze_5023'/blocks.16/self_attn/Unsqueeze_output_0/blocks.16/self_attn/Unsqueeze" Unsqueeze fonnx::Unsqueeze_5025 Constant_6759"Constant*5 value*)BConstant_6759_attr::valueJ  &/blocks.16/self_attn/Gather_1_output_0 onnx::Unsqueeze_5025)/blocks.16/self_attn/Unsqueeze_1_output_0 /blocks.16/self_attn/Unsqueeze_1" Unsqueeze (/blocks.16/self_attn/Constant_2_output_0/blocks.16/self_attn/Constant_2"Constant*G value*;B+/blocks.16/self_attn/Constant_2_attr::valueJ (/blocks.16/self_attn/Constant_3_output_0/blocks.16/self_attn/Constant_3"Constant*G value*;B+/blocks.16/self_attn/Constant_3_attr::valueJ  '/blocks.16/self_attn/Unsqueeze_output_0 )/blocks.16/self_attn/Unsqueeze_1_output_0 (/blocks.16/self_attn/Constant_2_output_0 (/blocks.16/self_attn/Constant_3_output_0$/blocks.16/self_attn/Concat_output_0/blocks.16/self_attn/Concat"Concat* axis  +/blocks.16/self_attn/q_proj/MatMul_output_0 $/blocks.16/self_attn/Concat_output_0%/blocks.16/self_attn/Reshape_output_0/blocks.16/self_attn/Reshape"Reshape* allowzero fonnx::Unsqueeze_5033 Constant_6765"Constant*5 value*)BConstant_6765_attr::valueJ  $/blocks.16/self_attn/Gather_output_0 onnx::Unsqueeze_5033)/blocks.16/self_attn/Unsqueeze_2_output_0 /blocks.16/self_attn/Unsqueeze_2" Unsqueeze fonnx::Unsqueeze_5035 Constant_6767"Constant*5 value*)BConstant_6767_attr::valueJ  &/blocks.16/self_attn/Gather_1_output_0 onnx::Unsqueeze_5035)/blocks.16/self_attn/Unsqueeze_3_output_0 /blocks.16/self_attn/Unsqueeze_3" Unsqueeze (/blocks.16/self_attn/Constant_4_output_0/blocks.16/self_attn/Constant_4"Constant*G value*;B+/blocks.16/self_attn/Constant_4_attr::valueJ (/blocks.16/self_attn/Constant_5_output_0/blocks.16/self_attn/Constant_5"Constant*G value*;B+/blocks.16/self_attn/Constant_5_attr::valueJ  )/blocks.16/self_attn/Unsqueeze_2_output_0 )/blocks.16/self_attn/Unsqueeze_3_output_0 (/blocks.16/self_attn/Constant_4_output_0 (/blocks.16/self_attn/Constant_5_output_0&/blocks.16/self_attn/Concat_1_output_0/blocks.16/self_attn/Concat_1"Concat* axis fonnx::Unsqueeze_5042 Constant_6772"Constant*5 value*)BConstant_6772_attr::valueJ  $/blocks.16/self_attn/Gather_output_0 onnx::Unsqueeze_5042)/blocks.16/self_attn/Unsqueeze_4_output_0 /blocks.16/self_attn/Unsqueeze_4" Unsqueeze fonnx::Unsqueeze_5044 Constant_6774"Constant*5 value*)BConstant_6774_attr::valueJ  &/blocks.16/self_attn/Gather_1_output_0 onnx::Unsqueeze_5044)/blocks.16/self_attn/Unsqueeze_5_output_0 /blocks.16/self_attn/Unsqueeze_5" Unsqueeze (/blocks.16/self_attn/Constant_6_output_0/blocks.16/self_attn/Constant_6"Constant*G value*;B+/blocks.16/self_attn/Constant_6_attr::valueJ (/blocks.16/self_attn/Constant_7_output_0/blocks.16/self_attn/Constant_7"Constant*G value*;B+/blocks.16/self_attn/Constant_7_attr::valueJ  )/blocks.16/self_attn/Unsqueeze_4_output_0 )/blocks.16/self_attn/Unsqueeze_5_output_0 (/blocks.16/self_attn/Constant_6_output_0 (/blocks.16/self_attn/Constant_7_output_0&/blocks.16/self_attn/Concat_2_output_0/blocks.16/self_attn/Concat_2"Concat* axis  +/blocks.16/self_attn/k_proj/MatMul_output_0 &/blocks.16/self_attn/Concat_1_output_0'/blocks.16/self_attn/Reshape_1_output_0/blocks.16/self_attn/Reshape_1"Reshape* allowzero  +/blocks.16/self_attn/v_proj/MatMul_output_0 &/blocks.16/self_attn/Concat_2_output_0'/blocks.16/self_attn/Reshape_2_output_0/blocks.16/self_attn/Reshape_2"Reshape* allowzero  %/blocks.16/self_attn/Reshape_output_0)/blocks.16/self_attn/q_norm/Cast_output_0 /blocks.16/self_attn/q_norm/Cast"Cast* to -/blocks.16/self_attn/q_norm/Constant_output_0$/blocks.16/self_attn/q_norm/Constant"Constant*F value*:B0/blocks.16/self_attn/q_norm/Constant_attr::valueJ@  )/blocks.16/self_attn/q_norm/Cast_output_0 -/blocks.16/self_attn/q_norm/Constant_output_0(/blocks.16/self_attn/q_norm/Pow_output_0/blocks.16/self_attn/q_norm/Pow"Pow  (/blocks.16/self_attn/q_norm/Pow_output_0//blocks.16/self_attn/q_norm/ReduceMean_output_0&/blocks.16/self_attn/q_norm/ReduceMean" ReduceMean* axes@* keepdims //blocks.16/self_attn/q_norm/Constant_1_output_0&/blocks.16/self_attn/q_norm/Constant_1"Constant*H value*<B2/blocks.16/self_attn/q_norm/Constant_1_attr::valueJ75  //blocks.16/self_attn/q_norm/ReduceMean_output_0 //blocks.16/self_attn/q_norm/Constant_1_output_0(/blocks.16/self_attn/q_norm/Add_output_0/blocks.16/self_attn/q_norm/Add"Add } (/blocks.16/self_attn/q_norm/Add_output_0)/blocks.16/self_attn/q_norm/Sqrt_output_0 /blocks.16/self_attn/q_norm/Sqrt"Sqrt //blocks.16/self_attn/q_norm/Constant_2_output_0&/blocks.16/self_attn/q_norm/Constant_2"Constant*H value*<B2/blocks.16/self_attn/q_norm/Constant_2_attr::valueJ?  //blocks.16/self_attn/q_norm/Constant_2_output_0 )/blocks.16/self_attn/q_norm/Sqrt_output_0(/blocks.16/self_attn/q_norm/Div_output_0/blocks.16/self_attn/q_norm/Div"Div  )/blocks.16/self_attn/q_norm/Cast_output_0+/blocks.16/self_attn/q_norm/Cast_1_output_0"/blocks.16/self_attn/q_norm/Cast_1"Cast* to  +/blocks.16/self_attn/q_norm/Cast_1_output_0 (/blocks.16/self_attn/q_norm/Div_output_0(/blocks.16/self_attn/q_norm/Mul_output_0/blocks.16/self_attn/q_norm/Mul"Mul  (/blocks.16/self_attn/q_norm/Mul_output_0 !blocks.16.self_attn.q_norm.weight*/blocks.16/self_attn/q_norm/Mul_1_output_0!/blocks.16/self_attn/q_norm/Mul_1"Mul  */blocks.16/self_attn/q_norm/Mul_1_output_0+/blocks.16/self_attn/q_norm/Cast_2_output_0"/blocks.16/self_attn/q_norm/Cast_2"Cast* to  '/blocks.16/self_attn/Reshape_1_output_0)/blocks.16/self_attn/k_norm/Cast_output_0 /blocks.16/self_attn/k_norm/Cast"Cast* to -/blocks.16/self_attn/k_norm/Constant_output_0$/blocks.16/self_attn/k_norm/Constant"Constant*F value*:B0/blocks.16/self_attn/k_norm/Constant_attr::valueJ@  )/blocks.16/self_attn/k_norm/Cast_output_0 -/blocks.16/self_attn/k_norm/Constant_output_0(/blocks.16/self_attn/k_norm/Pow_output_0/blocks.16/self_attn/k_norm/Pow"Pow  (/blocks.16/self_attn/k_norm/Pow_output_0//blocks.16/self_attn/k_norm/ReduceMean_output_0&/blocks.16/self_attn/k_norm/ReduceMean" ReduceMean* axes@* keepdims //blocks.16/self_attn/k_norm/Constant_1_output_0&/blocks.16/self_attn/k_norm/Constant_1"Constant*H value*<B2/blocks.16/self_attn/k_norm/Constant_1_attr::valueJ75  //blocks.16/self_attn/k_norm/ReduceMean_output_0 //blocks.16/self_attn/k_norm/Constant_1_output_0(/blocks.16/self_attn/k_norm/Add_output_0/blocks.16/self_attn/k_norm/Add"Add } (/blocks.16/self_attn/k_norm/Add_output_0)/blocks.16/self_attn/k_norm/Sqrt_output_0 /blocks.16/self_attn/k_norm/Sqrt"Sqrt //blocks.16/self_attn/k_norm/Constant_2_output_0&/blocks.16/self_attn/k_norm/Constant_2"Constant*H value*<B2/blocks.16/self_attn/k_norm/Constant_2_attr::valueJ?  //blocks.16/self_attn/k_norm/Constant_2_output_0 )/blocks.16/self_attn/k_norm/Sqrt_output_0(/blocks.16/self_attn/k_norm/Div_output_0/blocks.16/self_attn/k_norm/Div"Div  )/blocks.16/self_attn/k_norm/Cast_output_0+/blocks.16/self_attn/k_norm/Cast_1_output_0"/blocks.16/self_attn/k_norm/Cast_1"Cast* to  +/blocks.16/self_attn/k_norm/Cast_1_output_0 (/blocks.16/self_attn/k_norm/Div_output_0(/blocks.16/self_attn/k_norm/Mul_output_0/blocks.16/self_attn/k_norm/Mul"Mul  (/blocks.16/self_attn/k_norm/Mul_output_0 !blocks.16.self_attn.k_norm.weight*/blocks.16/self_attn/k_norm/Mul_1_output_0!/blocks.16/self_attn/k_norm/Mul_1"Mul  */blocks.16/self_attn/k_norm/Mul_1_output_0+/blocks.16/self_attn/k_norm/Cast_2_output_0"/blocks.16/self_attn/k_norm/Cast_2"Cast* to  +/blocks.16/self_attn/q_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0!/blocks.16/self_attn/Mul_output_0/blocks.16/self_attn/Mul"Mul y +/blocks.16/self_attn/q_norm/Cast_2_output_0%/blocks.16/self_attn/Shape_2_output_0/blocks.16/self_attn/Shape_2"Shape (/blocks.16/self_attn/Constant_8_output_0/blocks.16/self_attn/Constant_8"Constant*E value*9B+/blocks.16/self_attn/Constant_8_attr::valueJ  %/blocks.16/self_attn/Shape_2_output_0 (/blocks.16/self_attn/Constant_8_output_0&/blocks.16/self_attn/Gather_2_output_0/blocks.16/self_attn/Gather_2"Gather* axis (/blocks.16/self_attn/Constant_9_output_0/blocks.16/self_attn/Constant_9"Constant*E value*9B+/blocks.16/self_attn/Constant_9_attr::valueJ  &/blocks.16/self_attn/Gather_2_output_0 (/blocks.16/self_attn/Constant_9_output_0!/blocks.16/self_attn/Div_output_0/blocks.16/self_attn/Div"Div s !/blocks.16/self_attn/Div_output_0"/blocks.16/self_attn/Cast_output_0/blocks.16/self_attn/Cast"Cast* to x "/blocks.16/self_attn/Cast_output_0$/blocks.16/self_attn/Cast_1_output_0/blocks.16/self_attn/Cast_1"Cast* to )/blocks.16/self_attn/Constant_10_output_0 /blocks.16/self_attn/Constant_10"Constant*H value*<B,/blocks.16/self_attn/Constant_10_attr::valueJ )/blocks.16/self_attn/Constant_11_output_0 /blocks.16/self_attn/Constant_11"Constant*H value*<B,/blocks.16/self_attn/Constant_11_attr::valueJ )/blocks.16/self_attn/Constant_12_output_0 /blocks.16/self_attn/Constant_12"Constant*H value*<B,/blocks.16/self_attn/Constant_12_attr::valueJ  $/blocks.16/self_attn/Cast_1_output_0 )/blocks.16/self_attn/Constant_12_output_0)/blocks.16/self_attn/Unsqueeze_6_output_0 /blocks.16/self_attn/Unsqueeze_6" Unsqueeze )/blocks.16/self_attn/Constant_13_output_0 /blocks.16/self_attn/Constant_13"Constant*H value*<B,/blocks.16/self_attn/Constant_13_attr::valueJ  +/blocks.16/self_attn/q_norm/Cast_2_output_0 )/blocks.16/self_attn/Constant_11_output_0 )/blocks.16/self_attn/Unsqueeze_6_output_0 )/blocks.16/self_attn/Constant_10_output_0 )/blocks.16/self_attn/Constant_13_output_0#/blocks.16/self_attn/Slice_output_0/blocks.16/self_attn/Slice"Slice )/blocks.16/self_attn/Constant_14_output_0 /blocks.16/self_attn/Constant_14"Constant*H value*<B,/blocks.16/self_attn/Constant_14_attr::valueJ )/blocks.16/self_attn/Constant_15_output_0 /blocks.16/self_attn/Constant_15"Constant*H value*<B,/blocks.16/self_attn/Constant_15_attr::valueJ  $/blocks.16/self_attn/Cast_1_output_0 )/blocks.16/self_attn/Constant_15_output_0)/blocks.16/self_attn/Unsqueeze_7_output_0 /blocks.16/self_attn/Unsqueeze_7" Unsqueeze )/blocks.16/self_attn/Constant_16_output_0 /blocks.16/self_attn/Constant_16"Constant*H value*<B,/blocks.16/self_attn/Constant_16_attr::valueJ )/blocks.16/self_attn/Constant_17_output_0 /blocks.16/self_attn/Constant_17"Constant*H value*<B,/blocks.16/self_attn/Constant_17_attr::valueJ  +/blocks.16/self_attn/q_norm/Cast_2_output_0 )/blocks.16/self_attn/Unsqueeze_7_output_0 )/blocks.16/self_attn/Constant_16_output_0 )/blocks.16/self_attn/Constant_14_output_0 )/blocks.16/self_attn/Constant_17_output_0%/blocks.16/self_attn/Slice_1_output_0/blocks.16/self_attn/Slice_1"Slice i %/blocks.16/self_attn/Slice_1_output_0!/blocks.16/self_attn/Neg_output_0/blocks.16/self_attn/Neg"Neg  !/blocks.16/self_attn/Neg_output_0 #/blocks.16/self_attn/Slice_output_0&/blocks.16/self_attn/Concat_3_output_0/blocks.16/self_attn/Concat_3"Concat* axis  &/blocks.16/self_attn/Concat_3_output_0 %/blocks.0/self_attn/Gather_3_output_0#/blocks.16/self_attn/Mul_1_output_0/blocks.16/self_attn/Mul_1"Mul  !/blocks.16/self_attn/Mul_output_0 #/blocks.16/self_attn/Mul_1_output_0!/blocks.16/self_attn/Add_output_0/blocks.16/self_attn/Add"Add  +/blocks.16/self_attn/k_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0#/blocks.16/self_attn/Mul_2_output_0/blocks.16/self_attn/Mul_2"Mul y +/blocks.16/self_attn/k_norm/Cast_2_output_0%/blocks.16/self_attn/Shape_3_output_0/blocks.16/self_attn/Shape_3"Shape )/blocks.16/self_attn/Constant_18_output_0 /blocks.16/self_attn/Constant_18"Constant*F value*:B,/blocks.16/self_attn/Constant_18_attr::valueJ  %/blocks.16/self_attn/Shape_3_output_0 )/blocks.16/self_attn/Constant_18_output_0&/blocks.16/self_attn/Gather_3_output_0/blocks.16/self_attn/Gather_3"Gather* axis )/blocks.16/self_attn/Constant_19_output_0 /blocks.16/self_attn/Constant_19"Constant*F value*:B,/blocks.16/self_attn/Constant_19_attr::valueJ  &/blocks.16/self_attn/Gather_3_output_0 )/blocks.16/self_attn/Constant_19_output_0#/blocks.16/self_attn/Div_1_output_0/blocks.16/self_attn/Div_1"Div y #/blocks.16/self_attn/Div_1_output_0$/blocks.16/self_attn/Cast_2_output_0/blocks.16/self_attn/Cast_2"Cast* to z $/blocks.16/self_attn/Cast_2_output_0$/blocks.16/self_attn/Cast_3_output_0/blocks.16/self_attn/Cast_3"Cast* to )/blocks.16/self_attn/Constant_20_output_0 /blocks.16/self_attn/Constant_20"Constant*H value*<B,/blocks.16/self_attn/Constant_20_attr::valueJ )/blocks.16/self_attn/Constant_21_output_0 /blocks.16/self_attn/Constant_21"Constant*H value*<B,/blocks.16/self_attn/Constant_21_attr::valueJ )/blocks.16/self_attn/Constant_22_output_0 /blocks.16/self_attn/Constant_22"Constant*H value*<B,/blocks.16/self_attn/Constant_22_attr::valueJ  $/blocks.16/self_attn/Cast_3_output_0 )/blocks.16/self_attn/Constant_22_output_0)/blocks.16/self_attn/Unsqueeze_8_output_0 /blocks.16/self_attn/Unsqueeze_8" Unsqueeze )/blocks.16/self_attn/Constant_23_output_0 /blocks.16/self_attn/Constant_23"Constant*H value*<B,/blocks.16/self_attn/Constant_23_attr::valueJ  +/blocks.16/self_attn/k_norm/Cast_2_output_0 )/blocks.16/self_attn/Constant_21_output_0 )/blocks.16/self_attn/Unsqueeze_8_output_0 )/blocks.16/self_attn/Constant_20_output_0 )/blocks.16/self_attn/Constant_23_output_0%/blocks.16/self_attn/Slice_2_output_0/blocks.16/self_attn/Slice_2"Slice )/blocks.16/self_attn/Constant_24_output_0 /blocks.16/self_attn/Constant_24"Constant*H value*<B,/blocks.16/self_attn/Constant_24_attr::valueJ )/blocks.16/self_attn/Constant_25_output_0 /blocks.16/self_attn/Constant_25"Constant*H value*<B,/blocks.16/self_attn/Constant_25_attr::valueJ  $/blocks.16/self_attn/Cast_3_output_0 )/blocks.16/self_attn/Constant_25_output_0)/blocks.16/self_attn/Unsqueeze_9_output_0 /blocks.16/self_attn/Unsqueeze_9" Unsqueeze )/blocks.16/self_attn/Constant_26_output_0 /blocks.16/self_attn/Constant_26"Constant*H value*<B,/blocks.16/self_attn/Constant_26_attr::valueJ )/blocks.16/self_attn/Constant_27_output_0 /blocks.16/self_attn/Constant_27"Constant*H value*<B,/blocks.16/self_attn/Constant_27_attr::valueJ  +/blocks.16/self_attn/k_norm/Cast_2_output_0 )/blocks.16/self_attn/Unsqueeze_9_output_0 )/blocks.16/self_attn/Constant_26_output_0 )/blocks.16/self_attn/Constant_24_output_0 )/blocks.16/self_attn/Constant_27_output_0%/blocks.16/self_attn/Slice_3_output_0/blocks.16/self_attn/Slice_3"Slice m %/blocks.16/self_attn/Slice_3_output_0#/blocks.16/self_attn/Neg_1_output_0/blocks.16/self_attn/Neg_1"Neg  #/blocks.16/self_attn/Neg_1_output_0 %/blocks.16/self_attn/Slice_2_output_0&/blocks.16/self_attn/Concat_4_output_0/blocks.16/self_attn/Concat_4"Concat* axis  &/blocks.16/self_attn/Concat_4_output_0 %/blocks.0/self_attn/Gather_3_output_0#/blocks.16/self_attn/Mul_3_output_0/blocks.16/self_attn/Mul_3"Mul  #/blocks.16/self_attn/Mul_2_output_0 #/blocks.16/self_attn/Mul_3_output_0#/blocks.16/self_attn/Add_1_output_0/blocks.16/self_attn/Add_1"Add  /Gather_16_output_0 /rotary/Constant_3_output_0&/blocks.16/self_attn/Gather_4_output_0/blocks.16/self_attn/Gather_4"Gather* axis  /Gather_16_output_0 /rotary/Constant_8_output_0&/blocks.16/self_attn/Gather_5_output_0/blocks.16/self_attn/Gather_5"Gather* axis  &/blocks.16/self_attn/Gather_4_output_0 #/blocks.16/self_attn/Add_1_output_0&/blocks.16/self_attn/Concat_5_output_0/blocks.16/self_attn/Concat_5"Concat* axis  &/blocks.16/self_attn/Gather_5_output_0 '/blocks.16/self_attn/Reshape_2_output_0&/blocks.16/self_attn/Concat_6_output_0/blocks.16/self_attn/Concat_6"Concat* axis )/blocks.16/self_attn/Constant_28_output_0 /blocks.16/self_attn/Constant_28"Constant*H value*<B,/blocks.16/self_attn/Constant_28_attr::valueJ  &/blocks.16/self_attn/Concat_5_output_0 )/blocks.16/self_attn/Constant_28_output_0*/blocks.16/self_attn/Unsqueeze_10_output_0!/blocks.16/self_attn/Unsqueeze_10" Unsqueeze )/blocks.16/self_attn/Constant_29_output_0 /blocks.16/self_attn/Constant_29"Constant*H value*<B,/blocks.16/self_attn/Constant_29_attr::valueJ  &/blocks.16/self_attn/Concat_6_output_0 )/blocks.16/self_attn/Constant_29_output_0*/blocks.16/self_attn/Unsqueeze_11_output_0!/blocks.16/self_attn/Unsqueeze_11" Unsqueeze  */blocks.16/self_attn/Unsqueeze_10_output_0 */blocks.16/self_attn/Unsqueeze_11_output_0&/blocks.16/self_attn/Concat_7_output_0/blocks.16/self_attn/Concat_7"Concat* axis  !/blocks.16/self_attn/Add_output_0'/blocks.16/self_attn/Transpose_output_0/blocks.16/self_attn/Transpose" Transpose* perm@@@@  &/blocks.16/self_attn/Concat_5_output_0)/blocks.16/self_attn/Transpose_1_output_0 /blocks.16/self_attn/Transpose_1" Transpose* perm@@@@  &/blocks.16/self_attn/Concat_6_output_0)/blocks.16/self_attn/Transpose_2_output_0 /blocks.16/self_attn/Transpose_2" Transpose* perm@@@@ w )/blocks.16/self_attn/Transpose_1_output_0%/blocks.16/self_attn/Shape_4_output_0/blocks.16/self_attn/Shape_4"Shape )/blocks.16/self_attn/Constant_30_output_0 /blocks.16/self_attn/Constant_30"Constant*F value*:B,/blocks.16/self_attn/Constant_30_attr::valueJ  %/blocks.16/self_attn/Shape_4_output_0 )/blocks.16/self_attn/Constant_30_output_0&/blocks.16/self_attn/Gather_6_output_0/blocks.16/self_attn/Gather_6"Gather* axis w )/blocks.16/self_attn/Transpose_1_output_0%/blocks.16/self_attn/Shape_5_output_0/blocks.16/self_attn/Shape_5"Shape )/blocks.16/self_attn/Constant_31_output_0 /blocks.16/self_attn/Constant_31"Constant*F value*:B,/blocks.16/self_attn/Constant_31_attr::valueJ  %/blocks.16/self_attn/Shape_5_output_0 )/blocks.16/self_attn/Constant_31_output_0&/blocks.16/self_attn/Gather_7_output_0/blocks.16/self_attn/Gather_7"Gather* axis w )/blocks.16/self_attn/Transpose_1_output_0%/blocks.16/self_attn/Shape_6_output_0/blocks.16/self_attn/Shape_6"Shape )/blocks.16/self_attn/Constant_32_output_0 /blocks.16/self_attn/Constant_32"Constant*F value*:B,/blocks.16/self_attn/Constant_32_attr::valueJ  %/blocks.16/self_attn/Shape_6_output_0 )/blocks.16/self_attn/Constant_32_output_0&/blocks.16/self_attn/Gather_8_output_0/blocks.16/self_attn/Gather_8"Gather* axis w )/blocks.16/self_attn/Transpose_1_output_0%/blocks.16/self_attn/Shape_7_output_0/blocks.16/self_attn/Shape_7"Shape )/blocks.16/self_attn/Constant_33_output_0 /blocks.16/self_attn/Constant_33"Constant*F value*:B,/blocks.16/self_attn/Constant_33_attr::valueJ  %/blocks.16/self_attn/Shape_7_output_0 )/blocks.16/self_attn/Constant_33_output_0&/blocks.16/self_attn/Gather_9_output_0/blocks.16/self_attn/Gather_9"Gather* axis )/blocks.16/self_attn/Constant_34_output_0 /blocks.16/self_attn/Constant_34"Constant*H value*<B,/blocks.16/self_attn/Constant_34_attr::valueJ  )/blocks.16/self_attn/Transpose_1_output_0 )/blocks.16/self_attn/Constant_34_output_0*/blocks.16/self_attn/Unsqueeze_12_output_0!/blocks.16/self_attn/Unsqueeze_12" Unsqueeze )/blocks.16/self_attn/Constant_35_output_0 /blocks.16/self_attn/Constant_35"Constant*H value*<B,/blocks.16/self_attn/Constant_35_attr::valueJ  &/blocks.16/self_attn/Gather_6_output_0 )/blocks.16/self_attn/Constant_35_output_0*/blocks.16/self_attn/Unsqueeze_13_output_0!/blocks.16/self_attn/Unsqueeze_13" Unsqueeze )/blocks.16/self_attn/Constant_36_output_0 /blocks.16/self_attn/Constant_36"Constant*H value*<B,/blocks.16/self_attn/Constant_36_attr::valueJ  &/blocks.16/self_attn/Gather_7_output_0 )/blocks.16/self_attn/Constant_36_output_0*/blocks.16/self_attn/Unsqueeze_14_output_0!/blocks.16/self_attn/Unsqueeze_14" Unsqueeze )/blocks.16/self_attn/Constant_37_output_0 /blocks.16/self_attn/Constant_37"Constant*H value*<B,/blocks.16/self_attn/Constant_37_attr::valueJ )/blocks.16/self_attn/Constant_38_output_0 /blocks.16/self_attn/Constant_38"Constant*H value*<B,/blocks.16/self_attn/Constant_38_attr::valueJ  &/blocks.16/self_attn/Gather_8_output_0 )/blocks.16/self_attn/Constant_38_output_0*/blocks.16/self_attn/Unsqueeze_15_output_0!/blocks.16/self_attn/Unsqueeze_15" Unsqueeze )/blocks.16/self_attn/Constant_39_output_0 /blocks.16/self_attn/Constant_39"Constant*H value*<B,/blocks.16/self_attn/Constant_39_attr::valueJ  &/blocks.16/self_attn/Gather_9_output_0 )/blocks.16/self_attn/Constant_39_output_0*/blocks.16/self_attn/Unsqueeze_16_output_0!/blocks.16/self_attn/Unsqueeze_16" Unsqueeze  */blocks.16/self_attn/Unsqueeze_13_output_0 */blocks.16/self_attn/Unsqueeze_14_output_0 )/blocks.16/self_attn/Constant_37_output_0 */blocks.16/self_attn/Unsqueeze_15_output_0 */blocks.16/self_attn/Unsqueeze_16_output_0&/blocks.16/self_attn/Concat_8_output_0/blocks.16/self_attn/Concat_8"Concat* axis )/blocks.16/self_attn/Constant_40_output_0 /blocks.16/self_attn/Constant_40"Constant*H value*<B,/blocks.16/self_attn/Constant_40_attr::valueJ  &/blocks.16/self_attn/Concat_8_output_0 )/blocks.16/self_attn/Constant_40_output_0'/blocks.16/self_attn/Reshape_3_output_0/blocks.16/self_attn/Reshape_3"Reshape* allowzero u '/blocks.16/self_attn/Reshape_3_output_0%/blocks.16/self_attn/Shape_8_output_0/blocks.16/self_attn/Shape_8"Shape  %/blocks.16/self_attn/Shape_8_output_0-/blocks.16/self_attn/ConstantOfShape_output_0$/blocks.16/self_attn/ConstantOfShape"ConstantOfShape*L value*@B0/blocks.16/self_attn/ConstantOfShape_attr::valueJ )/blocks.16/self_attn/Constant_41_output_0 /blocks.16/self_attn/Constant_41"Constant*F value*:B,/blocks.16/self_attn/Constant_41_attr::valueJ  -/blocks.16/self_attn/ConstantOfShape_output_0 )/blocks.16/self_attn/Constant_41_output_0#/blocks.16/self_attn/Mul_4_output_0/blocks.16/self_attn/Mul_4"Mul  '/blocks.16/self_attn/Reshape_3_output_0 #/blocks.16/self_attn/Mul_4_output_0#/blocks.16/self_attn/Equal_output_0/blocks.16/self_attn/Equal"Equal  #/blocks.16/self_attn/Equal_output_0 -/blocks.16/self_attn/ConstantOfShape_output_0 '/blocks.16/self_attn/Reshape_3_output_0#/blocks.16/self_attn/Where_output_0/blocks.16/self_attn/Where"Where  */blocks.16/self_attn/Unsqueeze_12_output_0 #/blocks.16/self_attn/Where_output_0$/blocks.16/self_attn/Expand_output_0/blocks.16/self_attn/Expand"Expand )/blocks.16/self_attn/Constant_42_output_0 /blocks.16/self_attn/Constant_42"Constant*F value*:B,/blocks.16/self_attn/Constant_42_attr::valueJ  &/blocks.16/self_attn/Gather_7_output_0 )/blocks.16/self_attn/Constant_42_output_0#/blocks.16/self_attn/Mul_5_output_0/blocks.16/self_attn/Mul_5"Mul fonnx::Unsqueeze_5187 Constant_6902"Constant*5 value*)BConstant_6902_attr::valueJ  &/blocks.16/self_attn/Gather_6_output_0 onnx::Unsqueeze_5187*/blocks.16/self_attn/Unsqueeze_17_output_0!/blocks.16/self_attn/Unsqueeze_17" Unsqueeze fonnx::Unsqueeze_5189 Constant_6904"Constant*5 value*)BConstant_6904_attr::valueJ  #/blocks.16/self_attn/Mul_5_output_0 onnx::Unsqueeze_5189*/blocks.16/self_attn/Unsqueeze_18_output_0!/blocks.16/self_attn/Unsqueeze_18" Unsqueeze fonnx::Unsqueeze_5191 Constant_6906"Constant*5 value*)BConstant_6906_attr::valueJ  &/blocks.16/self_attn/Gather_8_output_0 onnx::Unsqueeze_5191*/blocks.16/self_attn/Unsqueeze_19_output_0!/blocks.16/self_attn/Unsqueeze_19" Unsqueeze fonnx::Unsqueeze_5193 Constant_6908"Constant*5 value*)BConstant_6908_attr::valueJ  &/blocks.16/self_attn/Gather_9_output_0 onnx::Unsqueeze_5193*/blocks.16/self_attn/Unsqueeze_20_output_0!/blocks.16/self_attn/Unsqueeze_20" Unsqueeze  */blocks.16/self_attn/Unsqueeze_17_output_0 */blocks.16/self_attn/Unsqueeze_18_output_0 */blocks.16/self_attn/Unsqueeze_19_output_0 */blocks.16/self_attn/Unsqueeze_20_output_0&/blocks.16/self_attn/Concat_9_output_0/blocks.16/self_attn/Concat_9"Concat* axis  $/blocks.16/self_attn/Expand_output_0 &/blocks.16/self_attn/Concat_9_output_0'/blocks.16/self_attn/Reshape_4_output_0/blocks.16/self_attn/Reshape_4"Reshape* allowzero w )/blocks.16/self_attn/Transpose_2_output_0%/blocks.16/self_attn/Shape_9_output_0/blocks.16/self_attn/Shape_9"Shape )/blocks.16/self_attn/Constant_43_output_0 /blocks.16/self_attn/Constant_43"Constant*F value*:B,/blocks.16/self_attn/Constant_43_attr::valueJ  %/blocks.16/self_attn/Shape_9_output_0 )/blocks.16/self_attn/Constant_43_output_0'/blocks.16/self_attn/Gather_10_output_0/blocks.16/self_attn/Gather_10"Gather* axis y )/blocks.16/self_attn/Transpose_2_output_0&/blocks.16/self_attn/Shape_10_output_0/blocks.16/self_attn/Shape_10"Shape )/blocks.16/self_attn/Constant_44_output_0 /blocks.16/self_attn/Constant_44"Constant*F value*:B,/blocks.16/self_attn/Constant_44_attr::valueJ  &/blocks.16/self_attn/Shape_10_output_0 )/blocks.16/self_attn/Constant_44_output_0'/blocks.16/self_attn/Gather_11_output_0/blocks.16/self_attn/Gather_11"Gather* axis y )/blocks.16/self_attn/Transpose_2_output_0&/blocks.16/self_attn/Shape_11_output_0/blocks.16/self_attn/Shape_11"Shape )/blocks.16/self_attn/Constant_45_output_0 /blocks.16/self_attn/Constant_45"Constant*F value*:B,/blocks.16/self_attn/Constant_45_attr::valueJ  &/blocks.16/self_attn/Shape_11_output_0 )/blocks.16/self_attn/Constant_45_output_0'/blocks.16/self_attn/Gather_12_output_0/blocks.16/self_attn/Gather_12"Gather* axis y )/blocks.16/self_attn/Transpose_2_output_0&/blocks.16/self_attn/Shape_12_output_0/blocks.16/self_attn/Shape_12"Shape )/blocks.16/self_attn/Constant_46_output_0 /blocks.16/self_attn/Constant_46"Constant*F value*:B,/blocks.16/self_attn/Constant_46_attr::valueJ  &/blocks.16/self_attn/Shape_12_output_0 )/blocks.16/self_attn/Constant_46_output_0'/blocks.16/self_attn/Gather_13_output_0/blocks.16/self_attn/Gather_13"Gather* axis )/blocks.16/self_attn/Constant_47_output_0 /blocks.16/self_attn/Constant_47"Constant*H value*<B,/blocks.16/self_attn/Constant_47_attr::valueJ  )/blocks.16/self_attn/Transpose_2_output_0 )/blocks.16/self_attn/Constant_47_output_0*/blocks.16/self_attn/Unsqueeze_21_output_0!/blocks.16/self_attn/Unsqueeze_21" Unsqueeze )/blocks.16/self_attn/Constant_48_output_0 /blocks.16/self_attn/Constant_48"Constant*H value*<B,/blocks.16/self_attn/Constant_48_attr::valueJ  '/blocks.16/self_attn/Gather_10_output_0 )/blocks.16/self_attn/Constant_48_output_0*/blocks.16/self_attn/Unsqueeze_22_output_0!/blocks.16/self_attn/Unsqueeze_22" Unsqueeze )/blocks.16/self_attn/Constant_49_output_0 /blocks.16/self_attn/Constant_49"Constant*H value*<B,/blocks.16/self_attn/Constant_49_attr::valueJ  '/blocks.16/self_attn/Gather_11_output_0 )/blocks.16/self_attn/Constant_49_output_0*/blocks.16/self_attn/Unsqueeze_23_output_0!/blocks.16/self_attn/Unsqueeze_23" Unsqueeze )/blocks.16/self_attn/Constant_50_output_0 /blocks.16/self_attn/Constant_50"Constant*H value*<B,/blocks.16/self_attn/Constant_50_attr::valueJ )/blocks.16/self_attn/Constant_51_output_0 /blocks.16/self_attn/Constant_51"Constant*H value*<B,/blocks.16/self_attn/Constant_51_attr::valueJ  '/blocks.16/self_attn/Gather_12_output_0 )/blocks.16/self_attn/Constant_51_output_0*/blocks.16/self_attn/Unsqueeze_24_output_0!/blocks.16/self_attn/Unsqueeze_24" Unsqueeze )/blocks.16/self_attn/Constant_52_output_0 /blocks.16/self_attn/Constant_52"Constant*H value*<B,/blocks.16/self_attn/Constant_52_attr::valueJ  '/blocks.16/self_attn/Gather_13_output_0 )/blocks.16/self_attn/Constant_52_output_0*/blocks.16/self_attn/Unsqueeze_25_output_0!/blocks.16/self_attn/Unsqueeze_25" Unsqueeze  */blocks.16/self_attn/Unsqueeze_22_output_0 */blocks.16/self_attn/Unsqueeze_23_output_0 )/blocks.16/self_attn/Constant_50_output_0 */blocks.16/self_attn/Unsqueeze_24_output_0 */blocks.16/self_attn/Unsqueeze_25_output_0'/blocks.16/self_attn/Concat_10_output_0/blocks.16/self_attn/Concat_10"Concat* axis )/blocks.16/self_attn/Constant_53_output_0 /blocks.16/self_attn/Constant_53"Constant*H value*<B,/blocks.16/self_attn/Constant_53_attr::valueJ  '/blocks.16/self_attn/Concat_10_output_0 )/blocks.16/self_attn/Constant_53_output_0'/blocks.16/self_attn/Reshape_5_output_0/blocks.16/self_attn/Reshape_5"Reshape* allowzero w '/blocks.16/self_attn/Reshape_5_output_0&/blocks.16/self_attn/Shape_13_output_0/blocks.16/self_attn/Shape_13"Shape  &/blocks.16/self_attn/Shape_13_output_0//blocks.16/self_attn/ConstantOfShape_1_output_0&/blocks.16/self_attn/ConstantOfShape_1"ConstantOfShape*N value*BB2/blocks.16/self_attn/ConstantOfShape_1_attr::valueJ )/blocks.16/self_attn/Constant_54_output_0 /blocks.16/self_attn/Constant_54"Constant*F value*:B,/blocks.16/self_attn/Constant_54_attr::valueJ  //blocks.16/self_attn/ConstantOfShape_1_output_0 )/blocks.16/self_attn/Constant_54_output_0#/blocks.16/self_attn/Mul_6_output_0/blocks.16/self_attn/Mul_6"Mul  '/blocks.16/self_attn/Reshape_5_output_0 #/blocks.16/self_attn/Mul_6_output_0%/blocks.16/self_attn/Equal_1_output_0/blocks.16/self_attn/Equal_1"Equal  %/blocks.16/self_attn/Equal_1_output_0 //blocks.16/self_attn/ConstantOfShape_1_output_0 '/blocks.16/self_attn/Reshape_5_output_0%/blocks.16/self_attn/Where_1_output_0/blocks.16/self_attn/Where_1"Where  */blocks.16/self_attn/Unsqueeze_21_output_0 %/blocks.16/self_attn/Where_1_output_0&/blocks.16/self_attn/Expand_1_output_0/blocks.16/self_attn/Expand_1"Expand )/blocks.16/self_attn/Constant_55_output_0 /blocks.16/self_attn/Constant_55"Constant*F value*:B,/blocks.16/self_attn/Constant_55_attr::valueJ  '/blocks.16/self_attn/Gather_11_output_0 )/blocks.16/self_attn/Constant_55_output_0#/blocks.16/self_attn/Mul_7_output_0/blocks.16/self_attn/Mul_7"Mul fonnx::Unsqueeze_5233 Constant_6947"Constant*5 value*)BConstant_6947_attr::valueJ  '/blocks.16/self_attn/Gather_10_output_0 onnx::Unsqueeze_5233*/blocks.16/self_attn/Unsqueeze_26_output_0!/blocks.16/self_attn/Unsqueeze_26" Unsqueeze fonnx::Unsqueeze_5235 Constant_6949"Constant*5 value*)BConstant_6949_attr::valueJ  #/blocks.16/self_attn/Mul_7_output_0 onnx::Unsqueeze_5235*/blocks.16/self_attn/Unsqueeze_27_output_0!/blocks.16/self_attn/Unsqueeze_27" Unsqueeze fonnx::Unsqueeze_5237 Constant_6951"Constant*5 value*)BConstant_6951_attr::valueJ  '/blocks.16/self_attn/Gather_12_output_0 onnx::Unsqueeze_5237*/blocks.16/self_attn/Unsqueeze_28_output_0!/blocks.16/self_attn/Unsqueeze_28" Unsqueeze fonnx::Unsqueeze_5239 Constant_6953"Constant*5 value*)BConstant_6953_attr::valueJ  '/blocks.16/self_attn/Gather_13_output_0 onnx::Unsqueeze_5239*/blocks.16/self_attn/Unsqueeze_29_output_0!/blocks.16/self_attn/Unsqueeze_29" Unsqueeze  */blocks.16/self_attn/Unsqueeze_26_output_0 */blocks.16/self_attn/Unsqueeze_27_output_0 */blocks.16/self_attn/Unsqueeze_28_output_0 */blocks.16/self_attn/Unsqueeze_29_output_0'/blocks.16/self_attn/Concat_11_output_0/blocks.16/self_attn/Concat_11"Concat* axis  &/blocks.16/self_attn/Expand_1_output_0 '/blocks.16/self_attn/Concat_11_output_0'/blocks.16/self_attn/Reshape_6_output_0/blocks.16/self_attn/Reshape_6"Reshape* allowzero  '/blocks.16/self_attn/Transpose_output_0 '/blocks.16/self_attn/Reshape_4_output_0$/blocks.16/self_attn/MatMul_output_0/blocks.16/self_attn/MatMul"MatMul )/blocks.16/self_attn/Constant_56_output_0 /blocks.16/self_attn/Constant_56"Constant*B value*6B,/blocks.16/self_attn/Constant_56_attr::valueJ5A  $/blocks.16/self_attn/MatMul_output_0 )/blocks.16/self_attn/Constant_56_output_0#/blocks.16/self_attn/Div_2_output_0/blocks.16/self_attn/Div_2"Div { #/blocks.16/self_attn/Div_2_output_0 attention_mask#/blocks.16/self_attn/Add_2_output_0/blocks.16/self_attn/Add_2"Add  #/blocks.16/self_attn/Add_2_output_0%/blocks.16/self_attn/Softmax_output_0/blocks.16/self_attn/Softmax"Softmax* axis { %/blocks.16/self_attn/Softmax_output_0$/blocks.16/self_attn/Cast_4_output_0/blocks.16/self_attn/Cast_4"Cast* to  $/blocks.16/self_attn/Cast_4_output_0 '/blocks.16/self_attn/Reshape_6_output_0&/blocks.16/self_attn/MatMul_1_output_0/blocks.16/self_attn/MatMul_1"MatMul  &/blocks.16/self_attn/MatMul_1_output_0)/blocks.16/self_attn/Transpose_3_output_0 /blocks.16/self_attn/Transpose_3" Transpose* perm@@@@ fonnx::Unsqueeze_5251 Constant_6965"Constant*5 value*)BConstant_6965_attr::valueJ  $/blocks.16/self_attn/Gather_output_0 onnx::Unsqueeze_5251*/blocks.16/self_attn/Unsqueeze_30_output_0!/blocks.16/self_attn/Unsqueeze_30" Unsqueeze fonnx::Unsqueeze_5253 Constant_6967"Constant*5 value*)BConstant_6967_attr::valueJ  &/blocks.16/self_attn/Gather_1_output_0 onnx::Unsqueeze_5253*/blocks.16/self_attn/Unsqueeze_31_output_0!/blocks.16/self_attn/Unsqueeze_31" Unsqueeze )/blocks.16/self_attn/Constant_57_output_0 /blocks.16/self_attn/Constant_57"Constant*H value*<B,/blocks.16/self_attn/Constant_57_attr::valueJ  */blocks.16/self_attn/Unsqueeze_30_output_0 */blocks.16/self_attn/Unsqueeze_31_output_0 )/blocks.16/self_attn/Constant_57_output_0'/blocks.16/self_attn/Concat_12_output_0/blocks.16/self_attn/Concat_12"Concat* axis  )/blocks.16/self_attn/Transpose_3_output_0 '/blocks.16/self_attn/Concat_12_output_0'/blocks.16/self_attn/Reshape_7_output_0/blocks.16/self_attn/Reshape_7"Reshape* allowzero  '/blocks.16/self_attn/Reshape_7_output_0 onnx::MatMul_9037+/blocks.16/self_attn/o_proj/MatMul_output_0"/blocks.16/self_attn/o_proj/MatMul"MatMul  */blocks.16/input_layernorm/Cast_1_output_0 +/blocks.16/self_attn/o_proj/MatMul_output_0/blocks.16/Add_output_0/blocks.16/Add"Add  /blocks.16/Add_output_01/blocks.16/post_attention_layernorm/Cast_output_0(/blocks.16/post_attention_layernorm/Cast"Cast* to 5/blocks.16/post_attention_layernorm/Constant_output_0,/blocks.16/post_attention_layernorm/Constant"Constant*N value*BB8/blocks.16/post_attention_layernorm/Constant_attr::valueJ@  1/blocks.16/post_attention_layernorm/Cast_output_0 5/blocks.16/post_attention_layernorm/Constant_output_00/blocks.16/post_attention_layernorm/Pow_output_0'/blocks.16/post_attention_layernorm/Pow"Pow  0/blocks.16/post_attention_layernorm/Pow_output_07/blocks.16/post_attention_layernorm/ReduceMean_output_0./blocks.16/post_attention_layernorm/ReduceMean" ReduceMean* axes@* keepdims 7/blocks.16/post_attention_layernorm/Constant_1_output_0./blocks.16/post_attention_layernorm/Constant_1"Constant*P value*DB:/blocks.16/post_attention_layernorm/Constant_1_attr::valueJ75  7/blocks.16/post_attention_layernorm/ReduceMean_output_0 7/blocks.16/post_attention_layernorm/Constant_1_output_00/blocks.16/post_attention_layernorm/Add_output_0'/blocks.16/post_attention_layernorm/Add"Add  0/blocks.16/post_attention_layernorm/Add_output_01/blocks.16/post_attention_layernorm/Sqrt_output_0(/blocks.16/post_attention_layernorm/Sqrt"Sqrt 7/blocks.16/post_attention_layernorm/Constant_2_output_0./blocks.16/post_attention_layernorm/Constant_2"Constant*P value*DB:/blocks.16/post_attention_layernorm/Constant_2_attr::valueJ?  7/blocks.16/post_attention_layernorm/Constant_2_output_0 1/blocks.16/post_attention_layernorm/Sqrt_output_00/blocks.16/post_attention_layernorm/Div_output_0'/blocks.16/post_attention_layernorm/Div"Div  1/blocks.16/post_attention_layernorm/Cast_output_03/blocks.16/post_attention_layernorm/Cast_1_output_0*/blocks.16/post_attention_layernorm/Cast_1"Cast* to  3/blocks.16/post_attention_layernorm/Cast_1_output_0 0/blocks.16/post_attention_layernorm/Div_output_00/blocks.16/post_attention_layernorm/Mul_output_0'/blocks.16/post_attention_layernorm/Mul"Mul  0/blocks.16/post_attention_layernorm/Mul_output_0 )blocks.16.post_attention_layernorm.weight2/blocks.16/post_attention_layernorm/Mul_1_output_0)/blocks.16/post_attention_layernorm/Mul_1"Mul  2/blocks.16/post_attention_layernorm/Mul_1_output_03/blocks.16/post_attention_layernorm/Cast_2_output_0*/blocks.16/post_attention_layernorm/Cast_2"Cast* to  3/blocks.16/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_9038(/blocks.16/mlp/gate_proj/MatMul_output_0/blocks.16/mlp/gate_proj/MatMul"MatMul z (/blocks.16/mlp/gate_proj/MatMul_output_0&/blocks.16/mlp/act_fn/Sigmoid_output_0/blocks.16/mlp/act_fn/Sigmoid"Sigmoid  (/blocks.16/mlp/gate_proj/MatMul_output_0 &/blocks.16/mlp/act_fn/Sigmoid_output_0"/blocks.16/mlp/act_fn/Mul_output_0/blocks.16/mlp/act_fn/Mul"Mul  3/blocks.16/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_9039&/blocks.16/mlp/up_proj/MatMul_output_0/blocks.16/mlp/up_proj/MatMul"MatMul  "/blocks.16/mlp/act_fn/Mul_output_0 &/blocks.16/mlp/up_proj/MatMul_output_0/blocks.16/mlp/Mul_output_0/blocks.16/mlp/Mul"Mul  /blocks.16/mlp/Mul_output_0 onnx::MatMul_9040(/blocks.16/mlp/down_proj/MatMul_output_0/blocks.16/mlp/down_proj/MatMul"MatMul  3/blocks.16/post_attention_layernorm/Cast_1_output_0 (/blocks.16/mlp/down_proj/MatMul_output_0/blocks.16/Add_1_output_0/blocks.16/Add_1"Add `/Constant_9_output_0 /Constant_9"Constant*1 value*%B/Constant_9_attr::valueJ ] past_key_values /Constant_9_output_0/Gather_17_output_0 /Gather_17"Gather* axis /blocks.17/Constant_output_0/blocks.17/Constant"Constant*K value*?B/blocks.17/Constant_attr::valueJ  /blocks.16/Add_1_output_0 /blocks.17/Constant_output_0/blocks.17/Reshape_output_0/blocks.17/Reshape"Reshape* allowzero y /blocks.17/Reshape_output_0(/blocks.17/input_layernorm/Cast_output_0/blocks.17/input_layernorm/Cast"Cast* to ,/blocks.17/input_layernorm/Constant_output_0#/blocks.17/input_layernorm/Constant"Constant*E value*9B//blocks.17/input_layernorm/Constant_attr::valueJ@  (/blocks.17/input_layernorm/Cast_output_0 ,/blocks.17/input_layernorm/Constant_output_0'/blocks.17/input_layernorm/Pow_output_0/blocks.17/input_layernorm/Pow"Pow  '/blocks.17/input_layernorm/Pow_output_0./blocks.17/input_layernorm/ReduceMean_output_0%/blocks.17/input_layernorm/ReduceMean" ReduceMean* axes@* keepdims ./blocks.17/input_layernorm/Constant_1_output_0%/blocks.17/input_layernorm/Constant_1"Constant*G value*;B1/blocks.17/input_layernorm/Constant_1_attr::valueJ75  ./blocks.17/input_layernorm/ReduceMean_output_0 ./blocks.17/input_layernorm/Constant_1_output_0'/blocks.17/input_layernorm/Add_output_0/blocks.17/input_layernorm/Add"Add z '/blocks.17/input_layernorm/Add_output_0(/blocks.17/input_layernorm/Sqrt_output_0/blocks.17/input_layernorm/Sqrt"Sqrt ./blocks.17/input_layernorm/Constant_2_output_0%/blocks.17/input_layernorm/Constant_2"Constant*G value*;B1/blocks.17/input_layernorm/Constant_2_attr::valueJ?  ./blocks.17/input_layernorm/Constant_2_output_0 (/blocks.17/input_layernorm/Sqrt_output_0'/blocks.17/input_layernorm/Div_output_0/blocks.17/input_layernorm/Div"Div  (/blocks.17/input_layernorm/Cast_output_0*/blocks.17/input_layernorm/Cast_1_output_0!/blocks.17/input_layernorm/Cast_1"Cast* to  */blocks.17/input_layernorm/Cast_1_output_0 '/blocks.17/input_layernorm/Div_output_0'/blocks.17/input_layernorm/Mul_output_0/blocks.17/input_layernorm/Mul"Mul  '/blocks.17/input_layernorm/Mul_output_0 blocks.17.input_layernorm.weight)/blocks.17/input_layernorm/Mul_1_output_0 /blocks.17/input_layernorm/Mul_1"Mul  )/blocks.17/input_layernorm/Mul_1_output_0*/blocks.17/input_layernorm/Cast_2_output_0!/blocks.17/input_layernorm/Cast_2"Cast* to t */blocks.17/input_layernorm/Cast_2_output_0#/blocks.17/self_attn/Shape_output_0/blocks.17/self_attn/Shape"Shape &/blocks.17/self_attn/Constant_output_0/blocks.17/self_attn/Constant"Constant*C value*7B)/blocks.17/self_attn/Constant_attr::valueJ  #/blocks.17/self_attn/Shape_output_0 &/blocks.17/self_attn/Constant_output_0$/blocks.17/self_attn/Gather_output_0/blocks.17/self_attn/Gather"Gather* axis x */blocks.17/input_layernorm/Cast_2_output_0%/blocks.17/self_attn/Shape_1_output_0/blocks.17/self_attn/Shape_1"Shape (/blocks.17/self_attn/Constant_1_output_0/blocks.17/self_attn/Constant_1"Constant*E value*9B+/blocks.17/self_attn/Constant_1_attr::valueJ  %/blocks.17/self_attn/Shape_1_output_0 (/blocks.17/self_attn/Constant_1_output_0&/blocks.17/self_attn/Gather_1_output_0/blocks.17/self_attn/Gather_1"Gather* axis  */blocks.17/input_layernorm/Cast_2_output_0 onnx::MatMul_9041+/blocks.17/self_attn/q_proj/MatMul_output_0"/blocks.17/self_attn/q_proj/MatMul"MatMul  */blocks.17/input_layernorm/Cast_2_output_0 onnx::MatMul_9042+/blocks.17/self_attn/k_proj/MatMul_output_0"/blocks.17/self_attn/k_proj/MatMul"MatMul  */blocks.17/input_layernorm/Cast_2_output_0 onnx::MatMul_9043+/blocks.17/self_attn/v_proj/MatMul_output_0"/blocks.17/self_attn/v_proj/MatMul"MatMul fonnx::Unsqueeze_5314 Constant_7020"Constant*5 value*)BConstant_7020_attr::valueJ  $/blocks.17/self_attn/Gather_output_0 onnx::Unsqueeze_5314'/blocks.17/self_attn/Unsqueeze_output_0/blocks.17/self_attn/Unsqueeze" Unsqueeze fonnx::Unsqueeze_5316 Constant_7022"Constant*5 value*)BConstant_7022_attr::valueJ  &/blocks.17/self_attn/Gather_1_output_0 onnx::Unsqueeze_5316)/blocks.17/self_attn/Unsqueeze_1_output_0 /blocks.17/self_attn/Unsqueeze_1" Unsqueeze (/blocks.17/self_attn/Constant_2_output_0/blocks.17/self_attn/Constant_2"Constant*G value*;B+/blocks.17/self_attn/Constant_2_attr::valueJ (/blocks.17/self_attn/Constant_3_output_0/blocks.17/self_attn/Constant_3"Constant*G value*;B+/blocks.17/self_attn/Constant_3_attr::valueJ  '/blocks.17/self_attn/Unsqueeze_output_0 )/blocks.17/self_attn/Unsqueeze_1_output_0 (/blocks.17/self_attn/Constant_2_output_0 (/blocks.17/self_attn/Constant_3_output_0$/blocks.17/self_attn/Concat_output_0/blocks.17/self_attn/Concat"Concat* axis  +/blocks.17/self_attn/q_proj/MatMul_output_0 $/blocks.17/self_attn/Concat_output_0%/blocks.17/self_attn/Reshape_output_0/blocks.17/self_attn/Reshape"Reshape* allowzero fonnx::Unsqueeze_5324 Constant_7028"Constant*5 value*)BConstant_7028_attr::valueJ  $/blocks.17/self_attn/Gather_output_0 onnx::Unsqueeze_5324)/blocks.17/self_attn/Unsqueeze_2_output_0 /blocks.17/self_attn/Unsqueeze_2" Unsqueeze fonnx::Unsqueeze_5326 Constant_7030"Constant*5 value*)BConstant_7030_attr::valueJ  &/blocks.17/self_attn/Gather_1_output_0 onnx::Unsqueeze_5326)/blocks.17/self_attn/Unsqueeze_3_output_0 /blocks.17/self_attn/Unsqueeze_3" Unsqueeze (/blocks.17/self_attn/Constant_4_output_0/blocks.17/self_attn/Constant_4"Constant*G value*;B+/blocks.17/self_attn/Constant_4_attr::valueJ (/blocks.17/self_attn/Constant_5_output_0/blocks.17/self_attn/Constant_5"Constant*G value*;B+/blocks.17/self_attn/Constant_5_attr::valueJ  )/blocks.17/self_attn/Unsqueeze_2_output_0 )/blocks.17/self_attn/Unsqueeze_3_output_0 (/blocks.17/self_attn/Constant_4_output_0 (/blocks.17/self_attn/Constant_5_output_0&/blocks.17/self_attn/Concat_1_output_0/blocks.17/self_attn/Concat_1"Concat* axis fonnx::Unsqueeze_5333 Constant_7035"Constant*5 value*)BConstant_7035_attr::valueJ  $/blocks.17/self_attn/Gather_output_0 onnx::Unsqueeze_5333)/blocks.17/self_attn/Unsqueeze_4_output_0 /blocks.17/self_attn/Unsqueeze_4" Unsqueeze fonnx::Unsqueeze_5335 Constant_7037"Constant*5 value*)BConstant_7037_attr::valueJ  &/blocks.17/self_attn/Gather_1_output_0 onnx::Unsqueeze_5335)/blocks.17/self_attn/Unsqueeze_5_output_0 /blocks.17/self_attn/Unsqueeze_5" Unsqueeze (/blocks.17/self_attn/Constant_6_output_0/blocks.17/self_attn/Constant_6"Constant*G value*;B+/blocks.17/self_attn/Constant_6_attr::valueJ (/blocks.17/self_attn/Constant_7_output_0/blocks.17/self_attn/Constant_7"Constant*G value*;B+/blocks.17/self_attn/Constant_7_attr::valueJ  )/blocks.17/self_attn/Unsqueeze_4_output_0 )/blocks.17/self_attn/Unsqueeze_5_output_0 (/blocks.17/self_attn/Constant_6_output_0 (/blocks.17/self_attn/Constant_7_output_0&/blocks.17/self_attn/Concat_2_output_0/blocks.17/self_attn/Concat_2"Concat* axis  +/blocks.17/self_attn/k_proj/MatMul_output_0 &/blocks.17/self_attn/Concat_1_output_0'/blocks.17/self_attn/Reshape_1_output_0/blocks.17/self_attn/Reshape_1"Reshape* allowzero  +/blocks.17/self_attn/v_proj/MatMul_output_0 &/blocks.17/self_attn/Concat_2_output_0'/blocks.17/self_attn/Reshape_2_output_0/blocks.17/self_attn/Reshape_2"Reshape* allowzero  %/blocks.17/self_attn/Reshape_output_0)/blocks.17/self_attn/q_norm/Cast_output_0 /blocks.17/self_attn/q_norm/Cast"Cast* to -/blocks.17/self_attn/q_norm/Constant_output_0$/blocks.17/self_attn/q_norm/Constant"Constant*F value*:B0/blocks.17/self_attn/q_norm/Constant_attr::valueJ@  )/blocks.17/self_attn/q_norm/Cast_output_0 -/blocks.17/self_attn/q_norm/Constant_output_0(/blocks.17/self_attn/q_norm/Pow_output_0/blocks.17/self_attn/q_norm/Pow"Pow  (/blocks.17/self_attn/q_norm/Pow_output_0//blocks.17/self_attn/q_norm/ReduceMean_output_0&/blocks.17/self_attn/q_norm/ReduceMean" ReduceMean* axes@* keepdims //blocks.17/self_attn/q_norm/Constant_1_output_0&/blocks.17/self_attn/q_norm/Constant_1"Constant*H value*<B2/blocks.17/self_attn/q_norm/Constant_1_attr::valueJ75  //blocks.17/self_attn/q_norm/ReduceMean_output_0 //blocks.17/self_attn/q_norm/Constant_1_output_0(/blocks.17/self_attn/q_norm/Add_output_0/blocks.17/self_attn/q_norm/Add"Add } (/blocks.17/self_attn/q_norm/Add_output_0)/blocks.17/self_attn/q_norm/Sqrt_output_0 /blocks.17/self_attn/q_norm/Sqrt"Sqrt //blocks.17/self_attn/q_norm/Constant_2_output_0&/blocks.17/self_attn/q_norm/Constant_2"Constant*H value*<B2/blocks.17/self_attn/q_norm/Constant_2_attr::valueJ?  //blocks.17/self_attn/q_norm/Constant_2_output_0 )/blocks.17/self_attn/q_norm/Sqrt_output_0(/blocks.17/self_attn/q_norm/Div_output_0/blocks.17/self_attn/q_norm/Div"Div  )/blocks.17/self_attn/q_norm/Cast_output_0+/blocks.17/self_attn/q_norm/Cast_1_output_0"/blocks.17/self_attn/q_norm/Cast_1"Cast* to  +/blocks.17/self_attn/q_norm/Cast_1_output_0 (/blocks.17/self_attn/q_norm/Div_output_0(/blocks.17/self_attn/q_norm/Mul_output_0/blocks.17/self_attn/q_norm/Mul"Mul  (/blocks.17/self_attn/q_norm/Mul_output_0 !blocks.17.self_attn.q_norm.weight*/blocks.17/self_attn/q_norm/Mul_1_output_0!/blocks.17/self_attn/q_norm/Mul_1"Mul  */blocks.17/self_attn/q_norm/Mul_1_output_0+/blocks.17/self_attn/q_norm/Cast_2_output_0"/blocks.17/self_attn/q_norm/Cast_2"Cast* to  '/blocks.17/self_attn/Reshape_1_output_0)/blocks.17/self_attn/k_norm/Cast_output_0 /blocks.17/self_attn/k_norm/Cast"Cast* to -/blocks.17/self_attn/k_norm/Constant_output_0$/blocks.17/self_attn/k_norm/Constant"Constant*F value*:B0/blocks.17/self_attn/k_norm/Constant_attr::valueJ@  )/blocks.17/self_attn/k_norm/Cast_output_0 -/blocks.17/self_attn/k_norm/Constant_output_0(/blocks.17/self_attn/k_norm/Pow_output_0/blocks.17/self_attn/k_norm/Pow"Pow  (/blocks.17/self_attn/k_norm/Pow_output_0//blocks.17/self_attn/k_norm/ReduceMean_output_0&/blocks.17/self_attn/k_norm/ReduceMean" ReduceMean* axes@* keepdims //blocks.17/self_attn/k_norm/Constant_1_output_0&/blocks.17/self_attn/k_norm/Constant_1"Constant*H value*<B2/blocks.17/self_attn/k_norm/Constant_1_attr::valueJ75  //blocks.17/self_attn/k_norm/ReduceMean_output_0 //blocks.17/self_attn/k_norm/Constant_1_output_0(/blocks.17/self_attn/k_norm/Add_output_0/blocks.17/self_attn/k_norm/Add"Add } (/blocks.17/self_attn/k_norm/Add_output_0)/blocks.17/self_attn/k_norm/Sqrt_output_0 /blocks.17/self_attn/k_norm/Sqrt"Sqrt //blocks.17/self_attn/k_norm/Constant_2_output_0&/blocks.17/self_attn/k_norm/Constant_2"Constant*H value*<B2/blocks.17/self_attn/k_norm/Constant_2_attr::valueJ?  //blocks.17/self_attn/k_norm/Constant_2_output_0 )/blocks.17/self_attn/k_norm/Sqrt_output_0(/blocks.17/self_attn/k_norm/Div_output_0/blocks.17/self_attn/k_norm/Div"Div  )/blocks.17/self_attn/k_norm/Cast_output_0+/blocks.17/self_attn/k_norm/Cast_1_output_0"/blocks.17/self_attn/k_norm/Cast_1"Cast* to  +/blocks.17/self_attn/k_norm/Cast_1_output_0 (/blocks.17/self_attn/k_norm/Div_output_0(/blocks.17/self_attn/k_norm/Mul_output_0/blocks.17/self_attn/k_norm/Mul"Mul  (/blocks.17/self_attn/k_norm/Mul_output_0 !blocks.17.self_attn.k_norm.weight*/blocks.17/self_attn/k_norm/Mul_1_output_0!/blocks.17/self_attn/k_norm/Mul_1"Mul  */blocks.17/self_attn/k_norm/Mul_1_output_0+/blocks.17/self_attn/k_norm/Cast_2_output_0"/blocks.17/self_attn/k_norm/Cast_2"Cast* to  +/blocks.17/self_attn/q_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0!/blocks.17/self_attn/Mul_output_0/blocks.17/self_attn/Mul"Mul y +/blocks.17/self_attn/q_norm/Cast_2_output_0%/blocks.17/self_attn/Shape_2_output_0/blocks.17/self_attn/Shape_2"Shape (/blocks.17/self_attn/Constant_8_output_0/blocks.17/self_attn/Constant_8"Constant*E value*9B+/blocks.17/self_attn/Constant_8_attr::valueJ  %/blocks.17/self_attn/Shape_2_output_0 (/blocks.17/self_attn/Constant_8_output_0&/blocks.17/self_attn/Gather_2_output_0/blocks.17/self_attn/Gather_2"Gather* axis (/blocks.17/self_attn/Constant_9_output_0/blocks.17/self_attn/Constant_9"Constant*E value*9B+/blocks.17/self_attn/Constant_9_attr::valueJ  &/blocks.17/self_attn/Gather_2_output_0 (/blocks.17/self_attn/Constant_9_output_0!/blocks.17/self_attn/Div_output_0/blocks.17/self_attn/Div"Div s !/blocks.17/self_attn/Div_output_0"/blocks.17/self_attn/Cast_output_0/blocks.17/self_attn/Cast"Cast* to x "/blocks.17/self_attn/Cast_output_0$/blocks.17/self_attn/Cast_1_output_0/blocks.17/self_attn/Cast_1"Cast* to )/blocks.17/self_attn/Constant_10_output_0 /blocks.17/self_attn/Constant_10"Constant*H value*<B,/blocks.17/self_attn/Constant_10_attr::valueJ )/blocks.17/self_attn/Constant_11_output_0 /blocks.17/self_attn/Constant_11"Constant*H value*<B,/blocks.17/self_attn/Constant_11_attr::valueJ )/blocks.17/self_attn/Constant_12_output_0 /blocks.17/self_attn/Constant_12"Constant*H value*<B,/blocks.17/self_attn/Constant_12_attr::valueJ  $/blocks.17/self_attn/Cast_1_output_0 )/blocks.17/self_attn/Constant_12_output_0)/blocks.17/self_attn/Unsqueeze_6_output_0 /blocks.17/self_attn/Unsqueeze_6" Unsqueeze )/blocks.17/self_attn/Constant_13_output_0 /blocks.17/self_attn/Constant_13"Constant*H value*<B,/blocks.17/self_attn/Constant_13_attr::valueJ  +/blocks.17/self_attn/q_norm/Cast_2_output_0 )/blocks.17/self_attn/Constant_11_output_0 )/blocks.17/self_attn/Unsqueeze_6_output_0 )/blocks.17/self_attn/Constant_10_output_0 )/blocks.17/self_attn/Constant_13_output_0#/blocks.17/self_attn/Slice_output_0/blocks.17/self_attn/Slice"Slice )/blocks.17/self_attn/Constant_14_output_0 /blocks.17/self_attn/Constant_14"Constant*H value*<B,/blocks.17/self_attn/Constant_14_attr::valueJ )/blocks.17/self_attn/Constant_15_output_0 /blocks.17/self_attn/Constant_15"Constant*H value*<B,/blocks.17/self_attn/Constant_15_attr::valueJ  $/blocks.17/self_attn/Cast_1_output_0 )/blocks.17/self_attn/Constant_15_output_0)/blocks.17/self_attn/Unsqueeze_7_output_0 /blocks.17/self_attn/Unsqueeze_7" Unsqueeze )/blocks.17/self_attn/Constant_16_output_0 /blocks.17/self_attn/Constant_16"Constant*H value*<B,/blocks.17/self_attn/Constant_16_attr::valueJ )/blocks.17/self_attn/Constant_17_output_0 /blocks.17/self_attn/Constant_17"Constant*H value*<B,/blocks.17/self_attn/Constant_17_attr::valueJ  +/blocks.17/self_attn/q_norm/Cast_2_output_0 )/blocks.17/self_attn/Unsqueeze_7_output_0 )/blocks.17/self_attn/Constant_16_output_0 )/blocks.17/self_attn/Constant_14_output_0 )/blocks.17/self_attn/Constant_17_output_0%/blocks.17/self_attn/Slice_1_output_0/blocks.17/self_attn/Slice_1"Slice i %/blocks.17/self_attn/Slice_1_output_0!/blocks.17/self_attn/Neg_output_0/blocks.17/self_attn/Neg"Neg  !/blocks.17/self_attn/Neg_output_0 #/blocks.17/self_attn/Slice_output_0&/blocks.17/self_attn/Concat_3_output_0/blocks.17/self_attn/Concat_3"Concat* axis  &/blocks.17/self_attn/Concat_3_output_0 %/blocks.0/self_attn/Gather_3_output_0#/blocks.17/self_attn/Mul_1_output_0/blocks.17/self_attn/Mul_1"Mul  !/blocks.17/self_attn/Mul_output_0 #/blocks.17/self_attn/Mul_1_output_0!/blocks.17/self_attn/Add_output_0/blocks.17/self_attn/Add"Add  +/blocks.17/self_attn/k_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0#/blocks.17/self_attn/Mul_2_output_0/blocks.17/self_attn/Mul_2"Mul y +/blocks.17/self_attn/k_norm/Cast_2_output_0%/blocks.17/self_attn/Shape_3_output_0/blocks.17/self_attn/Shape_3"Shape )/blocks.17/self_attn/Constant_18_output_0 /blocks.17/self_attn/Constant_18"Constant*F value*:B,/blocks.17/self_attn/Constant_18_attr::valueJ  %/blocks.17/self_attn/Shape_3_output_0 )/blocks.17/self_attn/Constant_18_output_0&/blocks.17/self_attn/Gather_3_output_0/blocks.17/self_attn/Gather_3"Gather* axis )/blocks.17/self_attn/Constant_19_output_0 /blocks.17/self_attn/Constant_19"Constant*F value*:B,/blocks.17/self_attn/Constant_19_attr::valueJ  &/blocks.17/self_attn/Gather_3_output_0 )/blocks.17/self_attn/Constant_19_output_0#/blocks.17/self_attn/Div_1_output_0/blocks.17/self_attn/Div_1"Div y #/blocks.17/self_attn/Div_1_output_0$/blocks.17/self_attn/Cast_2_output_0/blocks.17/self_attn/Cast_2"Cast* to z $/blocks.17/self_attn/Cast_2_output_0$/blocks.17/self_attn/Cast_3_output_0/blocks.17/self_attn/Cast_3"Cast* to )/blocks.17/self_attn/Constant_20_output_0 /blocks.17/self_attn/Constant_20"Constant*H value*<B,/blocks.17/self_attn/Constant_20_attr::valueJ )/blocks.17/self_attn/Constant_21_output_0 /blocks.17/self_attn/Constant_21"Constant*H value*<B,/blocks.17/self_attn/Constant_21_attr::valueJ )/blocks.17/self_attn/Constant_22_output_0 /blocks.17/self_attn/Constant_22"Constant*H value*<B,/blocks.17/self_attn/Constant_22_attr::valueJ  $/blocks.17/self_attn/Cast_3_output_0 )/blocks.17/self_attn/Constant_22_output_0)/blocks.17/self_attn/Unsqueeze_8_output_0 /blocks.17/self_attn/Unsqueeze_8" Unsqueeze )/blocks.17/self_attn/Constant_23_output_0 /blocks.17/self_attn/Constant_23"Constant*H value*<B,/blocks.17/self_attn/Constant_23_attr::valueJ  +/blocks.17/self_attn/k_norm/Cast_2_output_0 )/blocks.17/self_attn/Constant_21_output_0 )/blocks.17/self_attn/Unsqueeze_8_output_0 )/blocks.17/self_attn/Constant_20_output_0 )/blocks.17/self_attn/Constant_23_output_0%/blocks.17/self_attn/Slice_2_output_0/blocks.17/self_attn/Slice_2"Slice )/blocks.17/self_attn/Constant_24_output_0 /blocks.17/self_attn/Constant_24"Constant*H value*<B,/blocks.17/self_attn/Constant_24_attr::valueJ )/blocks.17/self_attn/Constant_25_output_0 /blocks.17/self_attn/Constant_25"Constant*H value*<B,/blocks.17/self_attn/Constant_25_attr::valueJ  $/blocks.17/self_attn/Cast_3_output_0 )/blocks.17/self_attn/Constant_25_output_0)/blocks.17/self_attn/Unsqueeze_9_output_0 /blocks.17/self_attn/Unsqueeze_9" Unsqueeze )/blocks.17/self_attn/Constant_26_output_0 /blocks.17/self_attn/Constant_26"Constant*H value*<B,/blocks.17/self_attn/Constant_26_attr::valueJ )/blocks.17/self_attn/Constant_27_output_0 /blocks.17/self_attn/Constant_27"Constant*H value*<B,/blocks.17/self_attn/Constant_27_attr::valueJ  +/blocks.17/self_attn/k_norm/Cast_2_output_0 )/blocks.17/self_attn/Unsqueeze_9_output_0 )/blocks.17/self_attn/Constant_26_output_0 )/blocks.17/self_attn/Constant_24_output_0 )/blocks.17/self_attn/Constant_27_output_0%/blocks.17/self_attn/Slice_3_output_0/blocks.17/self_attn/Slice_3"Slice m %/blocks.17/self_attn/Slice_3_output_0#/blocks.17/self_attn/Neg_1_output_0/blocks.17/self_attn/Neg_1"Neg  #/blocks.17/self_attn/Neg_1_output_0 %/blocks.17/self_attn/Slice_2_output_0&/blocks.17/self_attn/Concat_4_output_0/blocks.17/self_attn/Concat_4"Concat* axis  &/blocks.17/self_attn/Concat_4_output_0 %/blocks.0/self_attn/Gather_3_output_0#/blocks.17/self_attn/Mul_3_output_0/blocks.17/self_attn/Mul_3"Mul  #/blocks.17/self_attn/Mul_2_output_0 #/blocks.17/self_attn/Mul_3_output_0#/blocks.17/self_attn/Add_1_output_0/blocks.17/self_attn/Add_1"Add  /Gather_17_output_0 /rotary/Constant_3_output_0&/blocks.17/self_attn/Gather_4_output_0/blocks.17/self_attn/Gather_4"Gather* axis  /Gather_17_output_0 /rotary/Constant_8_output_0&/blocks.17/self_attn/Gather_5_output_0/blocks.17/self_attn/Gather_5"Gather* axis  &/blocks.17/self_attn/Gather_4_output_0 #/blocks.17/self_attn/Add_1_output_0&/blocks.17/self_attn/Concat_5_output_0/blocks.17/self_attn/Concat_5"Concat* axis  &/blocks.17/self_attn/Gather_5_output_0 '/blocks.17/self_attn/Reshape_2_output_0&/blocks.17/self_attn/Concat_6_output_0/blocks.17/self_attn/Concat_6"Concat* axis )/blocks.17/self_attn/Constant_28_output_0 /blocks.17/self_attn/Constant_28"Constant*H value*<B,/blocks.17/self_attn/Constant_28_attr::valueJ  &/blocks.17/self_attn/Concat_5_output_0 )/blocks.17/self_attn/Constant_28_output_0*/blocks.17/self_attn/Unsqueeze_10_output_0!/blocks.17/self_attn/Unsqueeze_10" Unsqueeze )/blocks.17/self_attn/Constant_29_output_0 /blocks.17/self_attn/Constant_29"Constant*H value*<B,/blocks.17/self_attn/Constant_29_attr::valueJ  &/blocks.17/self_attn/Concat_6_output_0 )/blocks.17/self_attn/Constant_29_output_0*/blocks.17/self_attn/Unsqueeze_11_output_0!/blocks.17/self_attn/Unsqueeze_11" Unsqueeze  */blocks.17/self_attn/Unsqueeze_10_output_0 */blocks.17/self_attn/Unsqueeze_11_output_0&/blocks.17/self_attn/Concat_7_output_0/blocks.17/self_attn/Concat_7"Concat* axis  !/blocks.17/self_attn/Add_output_0'/blocks.17/self_attn/Transpose_output_0/blocks.17/self_attn/Transpose" Transpose* perm@@@@  &/blocks.17/self_attn/Concat_5_output_0)/blocks.17/self_attn/Transpose_1_output_0 /blocks.17/self_attn/Transpose_1" Transpose* perm@@@@  &/blocks.17/self_attn/Concat_6_output_0)/blocks.17/self_attn/Transpose_2_output_0 /blocks.17/self_attn/Transpose_2" Transpose* perm@@@@ w )/blocks.17/self_attn/Transpose_1_output_0%/blocks.17/self_attn/Shape_4_output_0/blocks.17/self_attn/Shape_4"Shape )/blocks.17/self_attn/Constant_30_output_0 /blocks.17/self_attn/Constant_30"Constant*F value*:B,/blocks.17/self_attn/Constant_30_attr::valueJ  %/blocks.17/self_attn/Shape_4_output_0 )/blocks.17/self_attn/Constant_30_output_0&/blocks.17/self_attn/Gather_6_output_0/blocks.17/self_attn/Gather_6"Gather* axis w )/blocks.17/self_attn/Transpose_1_output_0%/blocks.17/self_attn/Shape_5_output_0/blocks.17/self_attn/Shape_5"Shape )/blocks.17/self_attn/Constant_31_output_0 /blocks.17/self_attn/Constant_31"Constant*F value*:B,/blocks.17/self_attn/Constant_31_attr::valueJ  %/blocks.17/self_attn/Shape_5_output_0 )/blocks.17/self_attn/Constant_31_output_0&/blocks.17/self_attn/Gather_7_output_0/blocks.17/self_attn/Gather_7"Gather* axis w )/blocks.17/self_attn/Transpose_1_output_0%/blocks.17/self_attn/Shape_6_output_0/blocks.17/self_attn/Shape_6"Shape )/blocks.17/self_attn/Constant_32_output_0 /blocks.17/self_attn/Constant_32"Constant*F value*:B,/blocks.17/self_attn/Constant_32_attr::valueJ  %/blocks.17/self_attn/Shape_6_output_0 )/blocks.17/self_attn/Constant_32_output_0&/blocks.17/self_attn/Gather_8_output_0/blocks.17/self_attn/Gather_8"Gather* axis w )/blocks.17/self_attn/Transpose_1_output_0%/blocks.17/self_attn/Shape_7_output_0/blocks.17/self_attn/Shape_7"Shape )/blocks.17/self_attn/Constant_33_output_0 /blocks.17/self_attn/Constant_33"Constant*F value*:B,/blocks.17/self_attn/Constant_33_attr::valueJ  %/blocks.17/self_attn/Shape_7_output_0 )/blocks.17/self_attn/Constant_33_output_0&/blocks.17/self_attn/Gather_9_output_0/blocks.17/self_attn/Gather_9"Gather* axis )/blocks.17/self_attn/Constant_34_output_0 /blocks.17/self_attn/Constant_34"Constant*H value*<B,/blocks.17/self_attn/Constant_34_attr::valueJ  )/blocks.17/self_attn/Transpose_1_output_0 )/blocks.17/self_attn/Constant_34_output_0*/blocks.17/self_attn/Unsqueeze_12_output_0!/blocks.17/self_attn/Unsqueeze_12" Unsqueeze )/blocks.17/self_attn/Constant_35_output_0 /blocks.17/self_attn/Constant_35"Constant*H value*<B,/blocks.17/self_attn/Constant_35_attr::valueJ  &/blocks.17/self_attn/Gather_6_output_0 )/blocks.17/self_attn/Constant_35_output_0*/blocks.17/self_attn/Unsqueeze_13_output_0!/blocks.17/self_attn/Unsqueeze_13" Unsqueeze )/blocks.17/self_attn/Constant_36_output_0 /blocks.17/self_attn/Constant_36"Constant*H value*<B,/blocks.17/self_attn/Constant_36_attr::valueJ  &/blocks.17/self_attn/Gather_7_output_0 )/blocks.17/self_attn/Constant_36_output_0*/blocks.17/self_attn/Unsqueeze_14_output_0!/blocks.17/self_attn/Unsqueeze_14" Unsqueeze )/blocks.17/self_attn/Constant_37_output_0 /blocks.17/self_attn/Constant_37"Constant*H value*<B,/blocks.17/self_attn/Constant_37_attr::valueJ )/blocks.17/self_attn/Constant_38_output_0 /blocks.17/self_attn/Constant_38"Constant*H value*<B,/blocks.17/self_attn/Constant_38_attr::valueJ  &/blocks.17/self_attn/Gather_8_output_0 )/blocks.17/self_attn/Constant_38_output_0*/blocks.17/self_attn/Unsqueeze_15_output_0!/blocks.17/self_attn/Unsqueeze_15" Unsqueeze )/blocks.17/self_attn/Constant_39_output_0 /blocks.17/self_attn/Constant_39"Constant*H value*<B,/blocks.17/self_attn/Constant_39_attr::valueJ  &/blocks.17/self_attn/Gather_9_output_0 )/blocks.17/self_attn/Constant_39_output_0*/blocks.17/self_attn/Unsqueeze_16_output_0!/blocks.17/self_attn/Unsqueeze_16" Unsqueeze  */blocks.17/self_attn/Unsqueeze_13_output_0 */blocks.17/self_attn/Unsqueeze_14_output_0 )/blocks.17/self_attn/Constant_37_output_0 */blocks.17/self_attn/Unsqueeze_15_output_0 */blocks.17/self_attn/Unsqueeze_16_output_0&/blocks.17/self_attn/Concat_8_output_0/blocks.17/self_attn/Concat_8"Concat* axis )/blocks.17/self_attn/Constant_40_output_0 /blocks.17/self_attn/Constant_40"Constant*H value*<B,/blocks.17/self_attn/Constant_40_attr::valueJ  &/blocks.17/self_attn/Concat_8_output_0 )/blocks.17/self_attn/Constant_40_output_0'/blocks.17/self_attn/Reshape_3_output_0/blocks.17/self_attn/Reshape_3"Reshape* allowzero u '/blocks.17/self_attn/Reshape_3_output_0%/blocks.17/self_attn/Shape_8_output_0/blocks.17/self_attn/Shape_8"Shape  %/blocks.17/self_attn/Shape_8_output_0-/blocks.17/self_attn/ConstantOfShape_output_0$/blocks.17/self_attn/ConstantOfShape"ConstantOfShape*L value*@B0/blocks.17/self_attn/ConstantOfShape_attr::valueJ )/blocks.17/self_attn/Constant_41_output_0 /blocks.17/self_attn/Constant_41"Constant*F value*:B,/blocks.17/self_attn/Constant_41_attr::valueJ  -/blocks.17/self_attn/ConstantOfShape_output_0 )/blocks.17/self_attn/Constant_41_output_0#/blocks.17/self_attn/Mul_4_output_0/blocks.17/self_attn/Mul_4"Mul  '/blocks.17/self_attn/Reshape_3_output_0 #/blocks.17/self_attn/Mul_4_output_0#/blocks.17/self_attn/Equal_output_0/blocks.17/self_attn/Equal"Equal  #/blocks.17/self_attn/Equal_output_0 -/blocks.17/self_attn/ConstantOfShape_output_0 '/blocks.17/self_attn/Reshape_3_output_0#/blocks.17/self_attn/Where_output_0/blocks.17/self_attn/Where"Where  */blocks.17/self_attn/Unsqueeze_12_output_0 #/blocks.17/self_attn/Where_output_0$/blocks.17/self_attn/Expand_output_0/blocks.17/self_attn/Expand"Expand )/blocks.17/self_attn/Constant_42_output_0 /blocks.17/self_attn/Constant_42"Constant*F value*:B,/blocks.17/self_attn/Constant_42_attr::valueJ  &/blocks.17/self_attn/Gather_7_output_0 )/blocks.17/self_attn/Constant_42_output_0#/blocks.17/self_attn/Mul_5_output_0/blocks.17/self_attn/Mul_5"Mul fonnx::Unsqueeze_5478 Constant_7165"Constant*5 value*)BConstant_7165_attr::valueJ  &/blocks.17/self_attn/Gather_6_output_0 onnx::Unsqueeze_5478*/blocks.17/self_attn/Unsqueeze_17_output_0!/blocks.17/self_attn/Unsqueeze_17" Unsqueeze fonnx::Unsqueeze_5480 Constant_7167"Constant*5 value*)BConstant_7167_attr::valueJ  #/blocks.17/self_attn/Mul_5_output_0 onnx::Unsqueeze_5480*/blocks.17/self_attn/Unsqueeze_18_output_0!/blocks.17/self_attn/Unsqueeze_18" Unsqueeze fonnx::Unsqueeze_5482 Constant_7169"Constant*5 value*)BConstant_7169_attr::valueJ  &/blocks.17/self_attn/Gather_8_output_0 onnx::Unsqueeze_5482*/blocks.17/self_attn/Unsqueeze_19_output_0!/blocks.17/self_attn/Unsqueeze_19" Unsqueeze fonnx::Unsqueeze_5484 Constant_7171"Constant*5 value*)BConstant_7171_attr::valueJ  &/blocks.17/self_attn/Gather_9_output_0 onnx::Unsqueeze_5484*/blocks.17/self_attn/Unsqueeze_20_output_0!/blocks.17/self_attn/Unsqueeze_20" Unsqueeze  */blocks.17/self_attn/Unsqueeze_17_output_0 */blocks.17/self_attn/Unsqueeze_18_output_0 */blocks.17/self_attn/Unsqueeze_19_output_0 */blocks.17/self_attn/Unsqueeze_20_output_0&/blocks.17/self_attn/Concat_9_output_0/blocks.17/self_attn/Concat_9"Concat* axis  $/blocks.17/self_attn/Expand_output_0 &/blocks.17/self_attn/Concat_9_output_0'/blocks.17/self_attn/Reshape_4_output_0/blocks.17/self_attn/Reshape_4"Reshape* allowzero w )/blocks.17/self_attn/Transpose_2_output_0%/blocks.17/self_attn/Shape_9_output_0/blocks.17/self_attn/Shape_9"Shape )/blocks.17/self_attn/Constant_43_output_0 /blocks.17/self_attn/Constant_43"Constant*F value*:B,/blocks.17/self_attn/Constant_43_attr::valueJ  %/blocks.17/self_attn/Shape_9_output_0 )/blocks.17/self_attn/Constant_43_output_0'/blocks.17/self_attn/Gather_10_output_0/blocks.17/self_attn/Gather_10"Gather* axis y )/blocks.17/self_attn/Transpose_2_output_0&/blocks.17/self_attn/Shape_10_output_0/blocks.17/self_attn/Shape_10"Shape )/blocks.17/self_attn/Constant_44_output_0 /blocks.17/self_attn/Constant_44"Constant*F value*:B,/blocks.17/self_attn/Constant_44_attr::valueJ  &/blocks.17/self_attn/Shape_10_output_0 )/blocks.17/self_attn/Constant_44_output_0'/blocks.17/self_attn/Gather_11_output_0/blocks.17/self_attn/Gather_11"Gather* axis y )/blocks.17/self_attn/Transpose_2_output_0&/blocks.17/self_attn/Shape_11_output_0/blocks.17/self_attn/Shape_11"Shape )/blocks.17/self_attn/Constant_45_output_0 /blocks.17/self_attn/Constant_45"Constant*F value*:B,/blocks.17/self_attn/Constant_45_attr::valueJ  &/blocks.17/self_attn/Shape_11_output_0 )/blocks.17/self_attn/Constant_45_output_0'/blocks.17/self_attn/Gather_12_output_0/blocks.17/self_attn/Gather_12"Gather* axis y )/blocks.17/self_attn/Transpose_2_output_0&/blocks.17/self_attn/Shape_12_output_0/blocks.17/self_attn/Shape_12"Shape )/blocks.17/self_attn/Constant_46_output_0 /blocks.17/self_attn/Constant_46"Constant*F value*:B,/blocks.17/self_attn/Constant_46_attr::valueJ  &/blocks.17/self_attn/Shape_12_output_0 )/blocks.17/self_attn/Constant_46_output_0'/blocks.17/self_attn/Gather_13_output_0/blocks.17/self_attn/Gather_13"Gather* axis )/blocks.17/self_attn/Constant_47_output_0 /blocks.17/self_attn/Constant_47"Constant*H value*<B,/blocks.17/self_attn/Constant_47_attr::valueJ  )/blocks.17/self_attn/Transpose_2_output_0 )/blocks.17/self_attn/Constant_47_output_0*/blocks.17/self_attn/Unsqueeze_21_output_0!/blocks.17/self_attn/Unsqueeze_21" Unsqueeze )/blocks.17/self_attn/Constant_48_output_0 /blocks.17/self_attn/Constant_48"Constant*H value*<B,/blocks.17/self_attn/Constant_48_attr::valueJ  '/blocks.17/self_attn/Gather_10_output_0 )/blocks.17/self_attn/Constant_48_output_0*/blocks.17/self_attn/Unsqueeze_22_output_0!/blocks.17/self_attn/Unsqueeze_22" Unsqueeze )/blocks.17/self_attn/Constant_49_output_0 /blocks.17/self_attn/Constant_49"Constant*H value*<B,/blocks.17/self_attn/Constant_49_attr::valueJ  '/blocks.17/self_attn/Gather_11_output_0 )/blocks.17/self_attn/Constant_49_output_0*/blocks.17/self_attn/Unsqueeze_23_output_0!/blocks.17/self_attn/Unsqueeze_23" Unsqueeze )/blocks.17/self_attn/Constant_50_output_0 /blocks.17/self_attn/Constant_50"Constant*H value*<B,/blocks.17/self_attn/Constant_50_attr::valueJ )/blocks.17/self_attn/Constant_51_output_0 /blocks.17/self_attn/Constant_51"Constant*H value*<B,/blocks.17/self_attn/Constant_51_attr::valueJ  '/blocks.17/self_attn/Gather_12_output_0 )/blocks.17/self_attn/Constant_51_output_0*/blocks.17/self_attn/Unsqueeze_24_output_0!/blocks.17/self_attn/Unsqueeze_24" Unsqueeze )/blocks.17/self_attn/Constant_52_output_0 /blocks.17/self_attn/Constant_52"Constant*H value*<B,/blocks.17/self_attn/Constant_52_attr::valueJ  '/blocks.17/self_attn/Gather_13_output_0 )/blocks.17/self_attn/Constant_52_output_0*/blocks.17/self_attn/Unsqueeze_25_output_0!/blocks.17/self_attn/Unsqueeze_25" Unsqueeze  */blocks.17/self_attn/Unsqueeze_22_output_0 */blocks.17/self_attn/Unsqueeze_23_output_0 )/blocks.17/self_attn/Constant_50_output_0 */blocks.17/self_attn/Unsqueeze_24_output_0 */blocks.17/self_attn/Unsqueeze_25_output_0'/blocks.17/self_attn/Concat_10_output_0/blocks.17/self_attn/Concat_10"Concat* axis )/blocks.17/self_attn/Constant_53_output_0 /blocks.17/self_attn/Constant_53"Constant*H value*<B,/blocks.17/self_attn/Constant_53_attr::valueJ  '/blocks.17/self_attn/Concat_10_output_0 )/blocks.17/self_attn/Constant_53_output_0'/blocks.17/self_attn/Reshape_5_output_0/blocks.17/self_attn/Reshape_5"Reshape* allowzero w '/blocks.17/self_attn/Reshape_5_output_0&/blocks.17/self_attn/Shape_13_output_0/blocks.17/self_attn/Shape_13"Shape  &/blocks.17/self_attn/Shape_13_output_0//blocks.17/self_attn/ConstantOfShape_1_output_0&/blocks.17/self_attn/ConstantOfShape_1"ConstantOfShape*N value*BB2/blocks.17/self_attn/ConstantOfShape_1_attr::valueJ )/blocks.17/self_attn/Constant_54_output_0 /blocks.17/self_attn/Constant_54"Constant*F value*:B,/blocks.17/self_attn/Constant_54_attr::valueJ  //blocks.17/self_attn/ConstantOfShape_1_output_0 )/blocks.17/self_attn/Constant_54_output_0#/blocks.17/self_attn/Mul_6_output_0/blocks.17/self_attn/Mul_6"Mul  '/blocks.17/self_attn/Reshape_5_output_0 #/blocks.17/self_attn/Mul_6_output_0%/blocks.17/self_attn/Equal_1_output_0/blocks.17/self_attn/Equal_1"Equal  %/blocks.17/self_attn/Equal_1_output_0 //blocks.17/self_attn/ConstantOfShape_1_output_0 '/blocks.17/self_attn/Reshape_5_output_0%/blocks.17/self_attn/Where_1_output_0/blocks.17/self_attn/Where_1"Where  */blocks.17/self_attn/Unsqueeze_21_output_0 %/blocks.17/self_attn/Where_1_output_0&/blocks.17/self_attn/Expand_1_output_0/blocks.17/self_attn/Expand_1"Expand )/blocks.17/self_attn/Constant_55_output_0 /blocks.17/self_attn/Constant_55"Constant*F value*:B,/blocks.17/self_attn/Constant_55_attr::valueJ  '/blocks.17/self_attn/Gather_11_output_0 )/blocks.17/self_attn/Constant_55_output_0#/blocks.17/self_attn/Mul_7_output_0/blocks.17/self_attn/Mul_7"Mul fonnx::Unsqueeze_5524 Constant_7210"Constant*5 value*)BConstant_7210_attr::valueJ  '/blocks.17/self_attn/Gather_10_output_0 onnx::Unsqueeze_5524*/blocks.17/self_attn/Unsqueeze_26_output_0!/blocks.17/self_attn/Unsqueeze_26" Unsqueeze fonnx::Unsqueeze_5526 Constant_7212"Constant*5 value*)BConstant_7212_attr::valueJ  #/blocks.17/self_attn/Mul_7_output_0 onnx::Unsqueeze_5526*/blocks.17/self_attn/Unsqueeze_27_output_0!/blocks.17/self_attn/Unsqueeze_27" Unsqueeze fonnx::Unsqueeze_5528 Constant_7214"Constant*5 value*)BConstant_7214_attr::valueJ  '/blocks.17/self_attn/Gather_12_output_0 onnx::Unsqueeze_5528*/blocks.17/self_attn/Unsqueeze_28_output_0!/blocks.17/self_attn/Unsqueeze_28" Unsqueeze fonnx::Unsqueeze_5530 Constant_7216"Constant*5 value*)BConstant_7216_attr::valueJ  '/blocks.17/self_attn/Gather_13_output_0 onnx::Unsqueeze_5530*/blocks.17/self_attn/Unsqueeze_29_output_0!/blocks.17/self_attn/Unsqueeze_29" Unsqueeze  */blocks.17/self_attn/Unsqueeze_26_output_0 */blocks.17/self_attn/Unsqueeze_27_output_0 */blocks.17/self_attn/Unsqueeze_28_output_0 */blocks.17/self_attn/Unsqueeze_29_output_0'/blocks.17/self_attn/Concat_11_output_0/blocks.17/self_attn/Concat_11"Concat* axis  &/blocks.17/self_attn/Expand_1_output_0 '/blocks.17/self_attn/Concat_11_output_0'/blocks.17/self_attn/Reshape_6_output_0/blocks.17/self_attn/Reshape_6"Reshape* allowzero  '/blocks.17/self_attn/Transpose_output_0 '/blocks.17/self_attn/Reshape_4_output_0$/blocks.17/self_attn/MatMul_output_0/blocks.17/self_attn/MatMul"MatMul )/blocks.17/self_attn/Constant_56_output_0 /blocks.17/self_attn/Constant_56"Constant*B value*6B,/blocks.17/self_attn/Constant_56_attr::valueJ5A  $/blocks.17/self_attn/MatMul_output_0 )/blocks.17/self_attn/Constant_56_output_0#/blocks.17/self_attn/Div_2_output_0/blocks.17/self_attn/Div_2"Div { #/blocks.17/self_attn/Div_2_output_0 attention_mask#/blocks.17/self_attn/Add_2_output_0/blocks.17/self_attn/Add_2"Add  #/blocks.17/self_attn/Add_2_output_0%/blocks.17/self_attn/Softmax_output_0/blocks.17/self_attn/Softmax"Softmax* axis { %/blocks.17/self_attn/Softmax_output_0$/blocks.17/self_attn/Cast_4_output_0/blocks.17/self_attn/Cast_4"Cast* to  $/blocks.17/self_attn/Cast_4_output_0 '/blocks.17/self_attn/Reshape_6_output_0&/blocks.17/self_attn/MatMul_1_output_0/blocks.17/self_attn/MatMul_1"MatMul  &/blocks.17/self_attn/MatMul_1_output_0)/blocks.17/self_attn/Transpose_3_output_0 /blocks.17/self_attn/Transpose_3" Transpose* perm@@@@ fonnx::Unsqueeze_5542 Constant_7228"Constant*5 value*)BConstant_7228_attr::valueJ  $/blocks.17/self_attn/Gather_output_0 onnx::Unsqueeze_5542*/blocks.17/self_attn/Unsqueeze_30_output_0!/blocks.17/self_attn/Unsqueeze_30" Unsqueeze fonnx::Unsqueeze_5544 Constant_7230"Constant*5 value*)BConstant_7230_attr::valueJ  &/blocks.17/self_attn/Gather_1_output_0 onnx::Unsqueeze_5544*/blocks.17/self_attn/Unsqueeze_31_output_0!/blocks.17/self_attn/Unsqueeze_31" Unsqueeze )/blocks.17/self_attn/Constant_57_output_0 /blocks.17/self_attn/Constant_57"Constant*H value*<B,/blocks.17/self_attn/Constant_57_attr::valueJ  */blocks.17/self_attn/Unsqueeze_30_output_0 */blocks.17/self_attn/Unsqueeze_31_output_0 )/blocks.17/self_attn/Constant_57_output_0'/blocks.17/self_attn/Concat_12_output_0/blocks.17/self_attn/Concat_12"Concat* axis  )/blocks.17/self_attn/Transpose_3_output_0 '/blocks.17/self_attn/Concat_12_output_0'/blocks.17/self_attn/Reshape_7_output_0/blocks.17/self_attn/Reshape_7"Reshape* allowzero  '/blocks.17/self_attn/Reshape_7_output_0 onnx::MatMul_9065+/blocks.17/self_attn/o_proj/MatMul_output_0"/blocks.17/self_attn/o_proj/MatMul"MatMul  */blocks.17/input_layernorm/Cast_1_output_0 +/blocks.17/self_attn/o_proj/MatMul_output_0/blocks.17/Add_output_0/blocks.17/Add"Add  /blocks.17/Add_output_01/blocks.17/post_attention_layernorm/Cast_output_0(/blocks.17/post_attention_layernorm/Cast"Cast* to 5/blocks.17/post_attention_layernorm/Constant_output_0,/blocks.17/post_attention_layernorm/Constant"Constant*N value*BB8/blocks.17/post_attention_layernorm/Constant_attr::valueJ@  1/blocks.17/post_attention_layernorm/Cast_output_0 5/blocks.17/post_attention_layernorm/Constant_output_00/blocks.17/post_attention_layernorm/Pow_output_0'/blocks.17/post_attention_layernorm/Pow"Pow  0/blocks.17/post_attention_layernorm/Pow_output_07/blocks.17/post_attention_layernorm/ReduceMean_output_0./blocks.17/post_attention_layernorm/ReduceMean" ReduceMean* axes@* keepdims 7/blocks.17/post_attention_layernorm/Constant_1_output_0./blocks.17/post_attention_layernorm/Constant_1"Constant*P value*DB:/blocks.17/post_attention_layernorm/Constant_1_attr::valueJ75  7/blocks.17/post_attention_layernorm/ReduceMean_output_0 7/blocks.17/post_attention_layernorm/Constant_1_output_00/blocks.17/post_attention_layernorm/Add_output_0'/blocks.17/post_attention_layernorm/Add"Add  0/blocks.17/post_attention_layernorm/Add_output_01/blocks.17/post_attention_layernorm/Sqrt_output_0(/blocks.17/post_attention_layernorm/Sqrt"Sqrt 7/blocks.17/post_attention_layernorm/Constant_2_output_0./blocks.17/post_attention_layernorm/Constant_2"Constant*P value*DB:/blocks.17/post_attention_layernorm/Constant_2_attr::valueJ?  7/blocks.17/post_attention_layernorm/Constant_2_output_0 1/blocks.17/post_attention_layernorm/Sqrt_output_00/blocks.17/post_attention_layernorm/Div_output_0'/blocks.17/post_attention_layernorm/Div"Div  1/blocks.17/post_attention_layernorm/Cast_output_03/blocks.17/post_attention_layernorm/Cast_1_output_0*/blocks.17/post_attention_layernorm/Cast_1"Cast* to  3/blocks.17/post_attention_layernorm/Cast_1_output_0 0/blocks.17/post_attention_layernorm/Div_output_00/blocks.17/post_attention_layernorm/Mul_output_0'/blocks.17/post_attention_layernorm/Mul"Mul  0/blocks.17/post_attention_layernorm/Mul_output_0 )blocks.17.post_attention_layernorm.weight2/blocks.17/post_attention_layernorm/Mul_1_output_0)/blocks.17/post_attention_layernorm/Mul_1"Mul  2/blocks.17/post_attention_layernorm/Mul_1_output_03/blocks.17/post_attention_layernorm/Cast_2_output_0*/blocks.17/post_attention_layernorm/Cast_2"Cast* to  3/blocks.17/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_9066(/blocks.17/mlp/gate_proj/MatMul_output_0/blocks.17/mlp/gate_proj/MatMul"MatMul z (/blocks.17/mlp/gate_proj/MatMul_output_0&/blocks.17/mlp/act_fn/Sigmoid_output_0/blocks.17/mlp/act_fn/Sigmoid"Sigmoid  (/blocks.17/mlp/gate_proj/MatMul_output_0 &/blocks.17/mlp/act_fn/Sigmoid_output_0"/blocks.17/mlp/act_fn/Mul_output_0/blocks.17/mlp/act_fn/Mul"Mul  3/blocks.17/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_9067&/blocks.17/mlp/up_proj/MatMul_output_0/blocks.17/mlp/up_proj/MatMul"MatMul  "/blocks.17/mlp/act_fn/Mul_output_0 &/blocks.17/mlp/up_proj/MatMul_output_0/blocks.17/mlp/Mul_output_0/blocks.17/mlp/Mul"Mul  /blocks.17/mlp/Mul_output_0 onnx::MatMul_9068(/blocks.17/mlp/down_proj/MatMul_output_0/blocks.17/mlp/down_proj/MatMul"MatMul  3/blocks.17/post_attention_layernorm/Cast_1_output_0 (/blocks.17/mlp/down_proj/MatMul_output_0/blocks.17/Add_1_output_0/blocks.17/Add_1"Add c/Constant_10_output_0 /Constant_10"Constant*2 value*&B/Constant_10_attr::valueJ ^ past_key_values /Constant_10_output_0/Gather_18_output_0 /Gather_18"Gather* axis /blocks.18/Constant_output_0/blocks.18/Constant"Constant*K value*?B/blocks.18/Constant_attr::valueJ  /blocks.17/Add_1_output_0 /blocks.18/Constant_output_0/blocks.18/Reshape_output_0/blocks.18/Reshape"Reshape* allowzero y /blocks.18/Reshape_output_0(/blocks.18/input_layernorm/Cast_output_0/blocks.18/input_layernorm/Cast"Cast* to ,/blocks.18/input_layernorm/Constant_output_0#/blocks.18/input_layernorm/Constant"Constant*E value*9B//blocks.18/input_layernorm/Constant_attr::valueJ@  (/blocks.18/input_layernorm/Cast_output_0 ,/blocks.18/input_layernorm/Constant_output_0'/blocks.18/input_layernorm/Pow_output_0/blocks.18/input_layernorm/Pow"Pow  '/blocks.18/input_layernorm/Pow_output_0./blocks.18/input_layernorm/ReduceMean_output_0%/blocks.18/input_layernorm/ReduceMean" ReduceMean* axes@* keepdims ./blocks.18/input_layernorm/Constant_1_output_0%/blocks.18/input_layernorm/Constant_1"Constant*G value*;B1/blocks.18/input_layernorm/Constant_1_attr::valueJ75  ./blocks.18/input_layernorm/ReduceMean_output_0 ./blocks.18/input_layernorm/Constant_1_output_0'/blocks.18/input_layernorm/Add_output_0/blocks.18/input_layernorm/Add"Add z '/blocks.18/input_layernorm/Add_output_0(/blocks.18/input_layernorm/Sqrt_output_0/blocks.18/input_layernorm/Sqrt"Sqrt ./blocks.18/input_layernorm/Constant_2_output_0%/blocks.18/input_layernorm/Constant_2"Constant*G value*;B1/blocks.18/input_layernorm/Constant_2_attr::valueJ?  ./blocks.18/input_layernorm/Constant_2_output_0 (/blocks.18/input_layernorm/Sqrt_output_0'/blocks.18/input_layernorm/Div_output_0/blocks.18/input_layernorm/Div"Div  (/blocks.18/input_layernorm/Cast_output_0*/blocks.18/input_layernorm/Cast_1_output_0!/blocks.18/input_layernorm/Cast_1"Cast* to  */blocks.18/input_layernorm/Cast_1_output_0 '/blocks.18/input_layernorm/Div_output_0'/blocks.18/input_layernorm/Mul_output_0/blocks.18/input_layernorm/Mul"Mul  '/blocks.18/input_layernorm/Mul_output_0 blocks.18.input_layernorm.weight)/blocks.18/input_layernorm/Mul_1_output_0 /blocks.18/input_layernorm/Mul_1"Mul  )/blocks.18/input_layernorm/Mul_1_output_0*/blocks.18/input_layernorm/Cast_2_output_0!/blocks.18/input_layernorm/Cast_2"Cast* to t */blocks.18/input_layernorm/Cast_2_output_0#/blocks.18/self_attn/Shape_output_0/blocks.18/self_attn/Shape"Shape &/blocks.18/self_attn/Constant_output_0/blocks.18/self_attn/Constant"Constant*C value*7B)/blocks.18/self_attn/Constant_attr::valueJ  #/blocks.18/self_attn/Shape_output_0 &/blocks.18/self_attn/Constant_output_0$/blocks.18/self_attn/Gather_output_0/blocks.18/self_attn/Gather"Gather* axis x */blocks.18/input_layernorm/Cast_2_output_0%/blocks.18/self_attn/Shape_1_output_0/blocks.18/self_attn/Shape_1"Shape (/blocks.18/self_attn/Constant_1_output_0/blocks.18/self_attn/Constant_1"Constant*E value*9B+/blocks.18/self_attn/Constant_1_attr::valueJ  %/blocks.18/self_attn/Shape_1_output_0 (/blocks.18/self_attn/Constant_1_output_0&/blocks.18/self_attn/Gather_1_output_0/blocks.18/self_attn/Gather_1"Gather* axis  */blocks.18/input_layernorm/Cast_2_output_0 onnx::MatMul_9069+/blocks.18/self_attn/q_proj/MatMul_output_0"/blocks.18/self_attn/q_proj/MatMul"MatMul  */blocks.18/input_layernorm/Cast_2_output_0 onnx::MatMul_9070+/blocks.18/self_attn/k_proj/MatMul_output_0"/blocks.18/self_attn/k_proj/MatMul"MatMul  */blocks.18/input_layernorm/Cast_2_output_0 onnx::MatMul_9071+/blocks.18/self_attn/v_proj/MatMul_output_0"/blocks.18/self_attn/v_proj/MatMul"MatMul fonnx::Unsqueeze_5605 Constant_7283"Constant*5 value*)BConstant_7283_attr::valueJ  $/blocks.18/self_attn/Gather_output_0 onnx::Unsqueeze_5605'/blocks.18/self_attn/Unsqueeze_output_0/blocks.18/self_attn/Unsqueeze" Unsqueeze fonnx::Unsqueeze_5607 Constant_7285"Constant*5 value*)BConstant_7285_attr::valueJ  &/blocks.18/self_attn/Gather_1_output_0 onnx::Unsqueeze_5607)/blocks.18/self_attn/Unsqueeze_1_output_0 /blocks.18/self_attn/Unsqueeze_1" Unsqueeze (/blocks.18/self_attn/Constant_2_output_0/blocks.18/self_attn/Constant_2"Constant*G value*;B+/blocks.18/self_attn/Constant_2_attr::valueJ (/blocks.18/self_attn/Constant_3_output_0/blocks.18/self_attn/Constant_3"Constant*G value*;B+/blocks.18/self_attn/Constant_3_attr::valueJ  '/blocks.18/self_attn/Unsqueeze_output_0 )/blocks.18/self_attn/Unsqueeze_1_output_0 (/blocks.18/self_attn/Constant_2_output_0 (/blocks.18/self_attn/Constant_3_output_0$/blocks.18/self_attn/Concat_output_0/blocks.18/self_attn/Concat"Concat* axis  +/blocks.18/self_attn/q_proj/MatMul_output_0 $/blocks.18/self_attn/Concat_output_0%/blocks.18/self_attn/Reshape_output_0/blocks.18/self_attn/Reshape"Reshape* allowzero fonnx::Unsqueeze_5615 Constant_7291"Constant*5 value*)BConstant_7291_attr::valueJ  $/blocks.18/self_attn/Gather_output_0 onnx::Unsqueeze_5615)/blocks.18/self_attn/Unsqueeze_2_output_0 /blocks.18/self_attn/Unsqueeze_2" Unsqueeze fonnx::Unsqueeze_5617 Constant_7293"Constant*5 value*)BConstant_7293_attr::valueJ  &/blocks.18/self_attn/Gather_1_output_0 onnx::Unsqueeze_5617)/blocks.18/self_attn/Unsqueeze_3_output_0 /blocks.18/self_attn/Unsqueeze_3" Unsqueeze (/blocks.18/self_attn/Constant_4_output_0/blocks.18/self_attn/Constant_4"Constant*G value*;B+/blocks.18/self_attn/Constant_4_attr::valueJ (/blocks.18/self_attn/Constant_5_output_0/blocks.18/self_attn/Constant_5"Constant*G value*;B+/blocks.18/self_attn/Constant_5_attr::valueJ  )/blocks.18/self_attn/Unsqueeze_2_output_0 )/blocks.18/self_attn/Unsqueeze_3_output_0 (/blocks.18/self_attn/Constant_4_output_0 (/blocks.18/self_attn/Constant_5_output_0&/blocks.18/self_attn/Concat_1_output_0/blocks.18/self_attn/Concat_1"Concat* axis fonnx::Unsqueeze_5624 Constant_7298"Constant*5 value*)BConstant_7298_attr::valueJ  $/blocks.18/self_attn/Gather_output_0 onnx::Unsqueeze_5624)/blocks.18/self_attn/Unsqueeze_4_output_0 /blocks.18/self_attn/Unsqueeze_4" Unsqueeze fonnx::Unsqueeze_5626 Constant_7300"Constant*5 value*)BConstant_7300_attr::valueJ  &/blocks.18/self_attn/Gather_1_output_0 onnx::Unsqueeze_5626)/blocks.18/self_attn/Unsqueeze_5_output_0 /blocks.18/self_attn/Unsqueeze_5" Unsqueeze (/blocks.18/self_attn/Constant_6_output_0/blocks.18/self_attn/Constant_6"Constant*G value*;B+/blocks.18/self_attn/Constant_6_attr::valueJ (/blocks.18/self_attn/Constant_7_output_0/blocks.18/self_attn/Constant_7"Constant*G value*;B+/blocks.18/self_attn/Constant_7_attr::valueJ  )/blocks.18/self_attn/Unsqueeze_4_output_0 )/blocks.18/self_attn/Unsqueeze_5_output_0 (/blocks.18/self_attn/Constant_6_output_0 (/blocks.18/self_attn/Constant_7_output_0&/blocks.18/self_attn/Concat_2_output_0/blocks.18/self_attn/Concat_2"Concat* axis  +/blocks.18/self_attn/k_proj/MatMul_output_0 &/blocks.18/self_attn/Concat_1_output_0'/blocks.18/self_attn/Reshape_1_output_0/blocks.18/self_attn/Reshape_1"Reshape* allowzero  +/blocks.18/self_attn/v_proj/MatMul_output_0 &/blocks.18/self_attn/Concat_2_output_0'/blocks.18/self_attn/Reshape_2_output_0/blocks.18/self_attn/Reshape_2"Reshape* allowzero  %/blocks.18/self_attn/Reshape_output_0)/blocks.18/self_attn/q_norm/Cast_output_0 /blocks.18/self_attn/q_norm/Cast"Cast* to -/blocks.18/self_attn/q_norm/Constant_output_0$/blocks.18/self_attn/q_norm/Constant"Constant*F value*:B0/blocks.18/self_attn/q_norm/Constant_attr::valueJ@  )/blocks.18/self_attn/q_norm/Cast_output_0 -/blocks.18/self_attn/q_norm/Constant_output_0(/blocks.18/self_attn/q_norm/Pow_output_0/blocks.18/self_attn/q_norm/Pow"Pow  (/blocks.18/self_attn/q_norm/Pow_output_0//blocks.18/self_attn/q_norm/ReduceMean_output_0&/blocks.18/self_attn/q_norm/ReduceMean" ReduceMean* axes@* keepdims //blocks.18/self_attn/q_norm/Constant_1_output_0&/blocks.18/self_attn/q_norm/Constant_1"Constant*H value*<B2/blocks.18/self_attn/q_norm/Constant_1_attr::valueJ75  //blocks.18/self_attn/q_norm/ReduceMean_output_0 //blocks.18/self_attn/q_norm/Constant_1_output_0(/blocks.18/self_attn/q_norm/Add_output_0/blocks.18/self_attn/q_norm/Add"Add } (/blocks.18/self_attn/q_norm/Add_output_0)/blocks.18/self_attn/q_norm/Sqrt_output_0 /blocks.18/self_attn/q_norm/Sqrt"Sqrt //blocks.18/self_attn/q_norm/Constant_2_output_0&/blocks.18/self_attn/q_norm/Constant_2"Constant*H value*<B2/blocks.18/self_attn/q_norm/Constant_2_attr::valueJ?  //blocks.18/self_attn/q_norm/Constant_2_output_0 )/blocks.18/self_attn/q_norm/Sqrt_output_0(/blocks.18/self_attn/q_norm/Div_output_0/blocks.18/self_attn/q_norm/Div"Div  )/blocks.18/self_attn/q_norm/Cast_output_0+/blocks.18/self_attn/q_norm/Cast_1_output_0"/blocks.18/self_attn/q_norm/Cast_1"Cast* to  +/blocks.18/self_attn/q_norm/Cast_1_output_0 (/blocks.18/self_attn/q_norm/Div_output_0(/blocks.18/self_attn/q_norm/Mul_output_0/blocks.18/self_attn/q_norm/Mul"Mul  (/blocks.18/self_attn/q_norm/Mul_output_0 !blocks.18.self_attn.q_norm.weight*/blocks.18/self_attn/q_norm/Mul_1_output_0!/blocks.18/self_attn/q_norm/Mul_1"Mul  */blocks.18/self_attn/q_norm/Mul_1_output_0+/blocks.18/self_attn/q_norm/Cast_2_output_0"/blocks.18/self_attn/q_norm/Cast_2"Cast* to  '/blocks.18/self_attn/Reshape_1_output_0)/blocks.18/self_attn/k_norm/Cast_output_0 /blocks.18/self_attn/k_norm/Cast"Cast* to -/blocks.18/self_attn/k_norm/Constant_output_0$/blocks.18/self_attn/k_norm/Constant"Constant*F value*:B0/blocks.18/self_attn/k_norm/Constant_attr::valueJ@  )/blocks.18/self_attn/k_norm/Cast_output_0 -/blocks.18/self_attn/k_norm/Constant_output_0(/blocks.18/self_attn/k_norm/Pow_output_0/blocks.18/self_attn/k_norm/Pow"Pow  (/blocks.18/self_attn/k_norm/Pow_output_0//blocks.18/self_attn/k_norm/ReduceMean_output_0&/blocks.18/self_attn/k_norm/ReduceMean" ReduceMean* axes@* keepdims //blocks.18/self_attn/k_norm/Constant_1_output_0&/blocks.18/self_attn/k_norm/Constant_1"Constant*H value*<B2/blocks.18/self_attn/k_norm/Constant_1_attr::valueJ75  //blocks.18/self_attn/k_norm/ReduceMean_output_0 //blocks.18/self_attn/k_norm/Constant_1_output_0(/blocks.18/self_attn/k_norm/Add_output_0/blocks.18/self_attn/k_norm/Add"Add } (/blocks.18/self_attn/k_norm/Add_output_0)/blocks.18/self_attn/k_norm/Sqrt_output_0 /blocks.18/self_attn/k_norm/Sqrt"Sqrt //blocks.18/self_attn/k_norm/Constant_2_output_0&/blocks.18/self_attn/k_norm/Constant_2"Constant*H value*<B2/blocks.18/self_attn/k_norm/Constant_2_attr::valueJ?  //blocks.18/self_attn/k_norm/Constant_2_output_0 )/blocks.18/self_attn/k_norm/Sqrt_output_0(/blocks.18/self_attn/k_norm/Div_output_0/blocks.18/self_attn/k_norm/Div"Div  )/blocks.18/self_attn/k_norm/Cast_output_0+/blocks.18/self_attn/k_norm/Cast_1_output_0"/blocks.18/self_attn/k_norm/Cast_1"Cast* to  +/blocks.18/self_attn/k_norm/Cast_1_output_0 (/blocks.18/self_attn/k_norm/Div_output_0(/blocks.18/self_attn/k_norm/Mul_output_0/blocks.18/self_attn/k_norm/Mul"Mul  (/blocks.18/self_attn/k_norm/Mul_output_0 !blocks.18.self_attn.k_norm.weight*/blocks.18/self_attn/k_norm/Mul_1_output_0!/blocks.18/self_attn/k_norm/Mul_1"Mul  */blocks.18/self_attn/k_norm/Mul_1_output_0+/blocks.18/self_attn/k_norm/Cast_2_output_0"/blocks.18/self_attn/k_norm/Cast_2"Cast* to  +/blocks.18/self_attn/q_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0!/blocks.18/self_attn/Mul_output_0/blocks.18/self_attn/Mul"Mul y +/blocks.18/self_attn/q_norm/Cast_2_output_0%/blocks.18/self_attn/Shape_2_output_0/blocks.18/self_attn/Shape_2"Shape (/blocks.18/self_attn/Constant_8_output_0/blocks.18/self_attn/Constant_8"Constant*E value*9B+/blocks.18/self_attn/Constant_8_attr::valueJ  %/blocks.18/self_attn/Shape_2_output_0 (/blocks.18/self_attn/Constant_8_output_0&/blocks.18/self_attn/Gather_2_output_0/blocks.18/self_attn/Gather_2"Gather* axis (/blocks.18/self_attn/Constant_9_output_0/blocks.18/self_attn/Constant_9"Constant*E value*9B+/blocks.18/self_attn/Constant_9_attr::valueJ  &/blocks.18/self_attn/Gather_2_output_0 (/blocks.18/self_attn/Constant_9_output_0!/blocks.18/self_attn/Div_output_0/blocks.18/self_attn/Div"Div s !/blocks.18/self_attn/Div_output_0"/blocks.18/self_attn/Cast_output_0/blocks.18/self_attn/Cast"Cast* to x "/blocks.18/self_attn/Cast_output_0$/blocks.18/self_attn/Cast_1_output_0/blocks.18/self_attn/Cast_1"Cast* to )/blocks.18/self_attn/Constant_10_output_0 /blocks.18/self_attn/Constant_10"Constant*H value*<B,/blocks.18/self_attn/Constant_10_attr::valueJ )/blocks.18/self_attn/Constant_11_output_0 /blocks.18/self_attn/Constant_11"Constant*H value*<B,/blocks.18/self_attn/Constant_11_attr::valueJ )/blocks.18/self_attn/Constant_12_output_0 /blocks.18/self_attn/Constant_12"Constant*H value*<B,/blocks.18/self_attn/Constant_12_attr::valueJ  $/blocks.18/self_attn/Cast_1_output_0 )/blocks.18/self_attn/Constant_12_output_0)/blocks.18/self_attn/Unsqueeze_6_output_0 /blocks.18/self_attn/Unsqueeze_6" Unsqueeze )/blocks.18/self_attn/Constant_13_output_0 /blocks.18/self_attn/Constant_13"Constant*H value*<B,/blocks.18/self_attn/Constant_13_attr::valueJ  +/blocks.18/self_attn/q_norm/Cast_2_output_0 )/blocks.18/self_attn/Constant_11_output_0 )/blocks.18/self_attn/Unsqueeze_6_output_0 )/blocks.18/self_attn/Constant_10_output_0 )/blocks.18/self_attn/Constant_13_output_0#/blocks.18/self_attn/Slice_output_0/blocks.18/self_attn/Slice"Slice )/blocks.18/self_attn/Constant_14_output_0 /blocks.18/self_attn/Constant_14"Constant*H value*<B,/blocks.18/self_attn/Constant_14_attr::valueJ )/blocks.18/self_attn/Constant_15_output_0 /blocks.18/self_attn/Constant_15"Constant*H value*<B,/blocks.18/self_attn/Constant_15_attr::valueJ  $/blocks.18/self_attn/Cast_1_output_0 )/blocks.18/self_attn/Constant_15_output_0)/blocks.18/self_attn/Unsqueeze_7_output_0 /blocks.18/self_attn/Unsqueeze_7" Unsqueeze )/blocks.18/self_attn/Constant_16_output_0 /blocks.18/self_attn/Constant_16"Constant*H value*<B,/blocks.18/self_attn/Constant_16_attr::valueJ )/blocks.18/self_attn/Constant_17_output_0 /blocks.18/self_attn/Constant_17"Constant*H value*<B,/blocks.18/self_attn/Constant_17_attr::valueJ  +/blocks.18/self_attn/q_norm/Cast_2_output_0 )/blocks.18/self_attn/Unsqueeze_7_output_0 )/blocks.18/self_attn/Constant_16_output_0 )/blocks.18/self_attn/Constant_14_output_0 )/blocks.18/self_attn/Constant_17_output_0%/blocks.18/self_attn/Slice_1_output_0/blocks.18/self_attn/Slice_1"Slice i %/blocks.18/self_attn/Slice_1_output_0!/blocks.18/self_attn/Neg_output_0/blocks.18/self_attn/Neg"Neg  !/blocks.18/self_attn/Neg_output_0 #/blocks.18/self_attn/Slice_output_0&/blocks.18/self_attn/Concat_3_output_0/blocks.18/self_attn/Concat_3"Concat* axis  &/blocks.18/self_attn/Concat_3_output_0 %/blocks.0/self_attn/Gather_3_output_0#/blocks.18/self_attn/Mul_1_output_0/blocks.18/self_attn/Mul_1"Mul  !/blocks.18/self_attn/Mul_output_0 #/blocks.18/self_attn/Mul_1_output_0!/blocks.18/self_attn/Add_output_0/blocks.18/self_attn/Add"Add  +/blocks.18/self_attn/k_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0#/blocks.18/self_attn/Mul_2_output_0/blocks.18/self_attn/Mul_2"Mul y +/blocks.18/self_attn/k_norm/Cast_2_output_0%/blocks.18/self_attn/Shape_3_output_0/blocks.18/self_attn/Shape_3"Shape )/blocks.18/self_attn/Constant_18_output_0 /blocks.18/self_attn/Constant_18"Constant*F value*:B,/blocks.18/self_attn/Constant_18_attr::valueJ  %/blocks.18/self_attn/Shape_3_output_0 )/blocks.18/self_attn/Constant_18_output_0&/blocks.18/self_attn/Gather_3_output_0/blocks.18/self_attn/Gather_3"Gather* axis )/blocks.18/self_attn/Constant_19_output_0 /blocks.18/self_attn/Constant_19"Constant*F value*:B,/blocks.18/self_attn/Constant_19_attr::valueJ  &/blocks.18/self_attn/Gather_3_output_0 )/blocks.18/self_attn/Constant_19_output_0#/blocks.18/self_attn/Div_1_output_0/blocks.18/self_attn/Div_1"Div y #/blocks.18/self_attn/Div_1_output_0$/blocks.18/self_attn/Cast_2_output_0/blocks.18/self_attn/Cast_2"Cast* to z $/blocks.18/self_attn/Cast_2_output_0$/blocks.18/self_attn/Cast_3_output_0/blocks.18/self_attn/Cast_3"Cast* to )/blocks.18/self_attn/Constant_20_output_0 /blocks.18/self_attn/Constant_20"Constant*H value*<B,/blocks.18/self_attn/Constant_20_attr::valueJ )/blocks.18/self_attn/Constant_21_output_0 /blocks.18/self_attn/Constant_21"Constant*H value*<B,/blocks.18/self_attn/Constant_21_attr::valueJ )/blocks.18/self_attn/Constant_22_output_0 /blocks.18/self_attn/Constant_22"Constant*H value*<B,/blocks.18/self_attn/Constant_22_attr::valueJ  $/blocks.18/self_attn/Cast_3_output_0 )/blocks.18/self_attn/Constant_22_output_0)/blocks.18/self_attn/Unsqueeze_8_output_0 /blocks.18/self_attn/Unsqueeze_8" Unsqueeze )/blocks.18/self_attn/Constant_23_output_0 /blocks.18/self_attn/Constant_23"Constant*H value*<B,/blocks.18/self_attn/Constant_23_attr::valueJ  +/blocks.18/self_attn/k_norm/Cast_2_output_0 )/blocks.18/self_attn/Constant_21_output_0 )/blocks.18/self_attn/Unsqueeze_8_output_0 )/blocks.18/self_attn/Constant_20_output_0 )/blocks.18/self_attn/Constant_23_output_0%/blocks.18/self_attn/Slice_2_output_0/blocks.18/self_attn/Slice_2"Slice )/blocks.18/self_attn/Constant_24_output_0 /blocks.18/self_attn/Constant_24"Constant*H value*<B,/blocks.18/self_attn/Constant_24_attr::valueJ )/blocks.18/self_attn/Constant_25_output_0 /blocks.18/self_attn/Constant_25"Constant*H value*<B,/blocks.18/self_attn/Constant_25_attr::valueJ  $/blocks.18/self_attn/Cast_3_output_0 )/blocks.18/self_attn/Constant_25_output_0)/blocks.18/self_attn/Unsqueeze_9_output_0 /blocks.18/self_attn/Unsqueeze_9" Unsqueeze )/blocks.18/self_attn/Constant_26_output_0 /blocks.18/self_attn/Constant_26"Constant*H value*<B,/blocks.18/self_attn/Constant_26_attr::valueJ )/blocks.18/self_attn/Constant_27_output_0 /blocks.18/self_attn/Constant_27"Constant*H value*<B,/blocks.18/self_attn/Constant_27_attr::valueJ  +/blocks.18/self_attn/k_norm/Cast_2_output_0 )/blocks.18/self_attn/Unsqueeze_9_output_0 )/blocks.18/self_attn/Constant_26_output_0 )/blocks.18/self_attn/Constant_24_output_0 )/blocks.18/self_attn/Constant_27_output_0%/blocks.18/self_attn/Slice_3_output_0/blocks.18/self_attn/Slice_3"Slice m %/blocks.18/self_attn/Slice_3_output_0#/blocks.18/self_attn/Neg_1_output_0/blocks.18/self_attn/Neg_1"Neg  #/blocks.18/self_attn/Neg_1_output_0 %/blocks.18/self_attn/Slice_2_output_0&/blocks.18/self_attn/Concat_4_output_0/blocks.18/self_attn/Concat_4"Concat* axis  &/blocks.18/self_attn/Concat_4_output_0 %/blocks.0/self_attn/Gather_3_output_0#/blocks.18/self_attn/Mul_3_output_0/blocks.18/self_attn/Mul_3"Mul  #/blocks.18/self_attn/Mul_2_output_0 #/blocks.18/self_attn/Mul_3_output_0#/blocks.18/self_attn/Add_1_output_0/blocks.18/self_attn/Add_1"Add  /Gather_18_output_0 /rotary/Constant_3_output_0&/blocks.18/self_attn/Gather_4_output_0/blocks.18/self_attn/Gather_4"Gather* axis  /Gather_18_output_0 /rotary/Constant_8_output_0&/blocks.18/self_attn/Gather_5_output_0/blocks.18/self_attn/Gather_5"Gather* axis  &/blocks.18/self_attn/Gather_4_output_0 #/blocks.18/self_attn/Add_1_output_0&/blocks.18/self_attn/Concat_5_output_0/blocks.18/self_attn/Concat_5"Concat* axis  &/blocks.18/self_attn/Gather_5_output_0 '/blocks.18/self_attn/Reshape_2_output_0&/blocks.18/self_attn/Concat_6_output_0/blocks.18/self_attn/Concat_6"Concat* axis )/blocks.18/self_attn/Constant_28_output_0 /blocks.18/self_attn/Constant_28"Constant*H value*<B,/blocks.18/self_attn/Constant_28_attr::valueJ  &/blocks.18/self_attn/Concat_5_output_0 )/blocks.18/self_attn/Constant_28_output_0*/blocks.18/self_attn/Unsqueeze_10_output_0!/blocks.18/self_attn/Unsqueeze_10" Unsqueeze )/blocks.18/self_attn/Constant_29_output_0 /blocks.18/self_attn/Constant_29"Constant*H value*<B,/blocks.18/self_attn/Constant_29_attr::valueJ  &/blocks.18/self_attn/Concat_6_output_0 )/blocks.18/self_attn/Constant_29_output_0*/blocks.18/self_attn/Unsqueeze_11_output_0!/blocks.18/self_attn/Unsqueeze_11" Unsqueeze  */blocks.18/self_attn/Unsqueeze_10_output_0 */blocks.18/self_attn/Unsqueeze_11_output_0&/blocks.18/self_attn/Concat_7_output_0/blocks.18/self_attn/Concat_7"Concat* axis  !/blocks.18/self_attn/Add_output_0'/blocks.18/self_attn/Transpose_output_0/blocks.18/self_attn/Transpose" Transpose* perm@@@@  &/blocks.18/self_attn/Concat_5_output_0)/blocks.18/self_attn/Transpose_1_output_0 /blocks.18/self_attn/Transpose_1" Transpose* perm@@@@  &/blocks.18/self_attn/Concat_6_output_0)/blocks.18/self_attn/Transpose_2_output_0 /blocks.18/self_attn/Transpose_2" Transpose* perm@@@@ w )/blocks.18/self_attn/Transpose_1_output_0%/blocks.18/self_attn/Shape_4_output_0/blocks.18/self_attn/Shape_4"Shape )/blocks.18/self_attn/Constant_30_output_0 /blocks.18/self_attn/Constant_30"Constant*F value*:B,/blocks.18/self_attn/Constant_30_attr::valueJ  %/blocks.18/self_attn/Shape_4_output_0 )/blocks.18/self_attn/Constant_30_output_0&/blocks.18/self_attn/Gather_6_output_0/blocks.18/self_attn/Gather_6"Gather* axis w )/blocks.18/self_attn/Transpose_1_output_0%/blocks.18/self_attn/Shape_5_output_0/blocks.18/self_attn/Shape_5"Shape )/blocks.18/self_attn/Constant_31_output_0 /blocks.18/self_attn/Constant_31"Constant*F value*:B,/blocks.18/self_attn/Constant_31_attr::valueJ  %/blocks.18/self_attn/Shape_5_output_0 )/blocks.18/self_attn/Constant_31_output_0&/blocks.18/self_attn/Gather_7_output_0/blocks.18/self_attn/Gather_7"Gather* axis w )/blocks.18/self_attn/Transpose_1_output_0%/blocks.18/self_attn/Shape_6_output_0/blocks.18/self_attn/Shape_6"Shape )/blocks.18/self_attn/Constant_32_output_0 /blocks.18/self_attn/Constant_32"Constant*F value*:B,/blocks.18/self_attn/Constant_32_attr::valueJ  %/blocks.18/self_attn/Shape_6_output_0 )/blocks.18/self_attn/Constant_32_output_0&/blocks.18/self_attn/Gather_8_output_0/blocks.18/self_attn/Gather_8"Gather* axis w )/blocks.18/self_attn/Transpose_1_output_0%/blocks.18/self_attn/Shape_7_output_0/blocks.18/self_attn/Shape_7"Shape )/blocks.18/self_attn/Constant_33_output_0 /blocks.18/self_attn/Constant_33"Constant*F value*:B,/blocks.18/self_attn/Constant_33_attr::valueJ  %/blocks.18/self_attn/Shape_7_output_0 )/blocks.18/self_attn/Constant_33_output_0&/blocks.18/self_attn/Gather_9_output_0/blocks.18/self_attn/Gather_9"Gather* axis )/blocks.18/self_attn/Constant_34_output_0 /blocks.18/self_attn/Constant_34"Constant*H value*<B,/blocks.18/self_attn/Constant_34_attr::valueJ  )/blocks.18/self_attn/Transpose_1_output_0 )/blocks.18/self_attn/Constant_34_output_0*/blocks.18/self_attn/Unsqueeze_12_output_0!/blocks.18/self_attn/Unsqueeze_12" Unsqueeze )/blocks.18/self_attn/Constant_35_output_0 /blocks.18/self_attn/Constant_35"Constant*H value*<B,/blocks.18/self_attn/Constant_35_attr::valueJ  &/blocks.18/self_attn/Gather_6_output_0 )/blocks.18/self_attn/Constant_35_output_0*/blocks.18/self_attn/Unsqueeze_13_output_0!/blocks.18/self_attn/Unsqueeze_13" Unsqueeze )/blocks.18/self_attn/Constant_36_output_0 /blocks.18/self_attn/Constant_36"Constant*H value*<B,/blocks.18/self_attn/Constant_36_attr::valueJ  &/blocks.18/self_attn/Gather_7_output_0 )/blocks.18/self_attn/Constant_36_output_0*/blocks.18/self_attn/Unsqueeze_14_output_0!/blocks.18/self_attn/Unsqueeze_14" Unsqueeze )/blocks.18/self_attn/Constant_37_output_0 /blocks.18/self_attn/Constant_37"Constant*H value*<B,/blocks.18/self_attn/Constant_37_attr::valueJ )/blocks.18/self_attn/Constant_38_output_0 /blocks.18/self_attn/Constant_38"Constant*H value*<B,/blocks.18/self_attn/Constant_38_attr::valueJ  &/blocks.18/self_attn/Gather_8_output_0 )/blocks.18/self_attn/Constant_38_output_0*/blocks.18/self_attn/Unsqueeze_15_output_0!/blocks.18/self_attn/Unsqueeze_15" Unsqueeze )/blocks.18/self_attn/Constant_39_output_0 /blocks.18/self_attn/Constant_39"Constant*H value*<B,/blocks.18/self_attn/Constant_39_attr::valueJ  &/blocks.18/self_attn/Gather_9_output_0 )/blocks.18/self_attn/Constant_39_output_0*/blocks.18/self_attn/Unsqueeze_16_output_0!/blocks.18/self_attn/Unsqueeze_16" Unsqueeze  */blocks.18/self_attn/Unsqueeze_13_output_0 */blocks.18/self_attn/Unsqueeze_14_output_0 )/blocks.18/self_attn/Constant_37_output_0 */blocks.18/self_attn/Unsqueeze_15_output_0 */blocks.18/self_attn/Unsqueeze_16_output_0&/blocks.18/self_attn/Concat_8_output_0/blocks.18/self_attn/Concat_8"Concat* axis )/blocks.18/self_attn/Constant_40_output_0 /blocks.18/self_attn/Constant_40"Constant*H value*<B,/blocks.18/self_attn/Constant_40_attr::valueJ  &/blocks.18/self_attn/Concat_8_output_0 )/blocks.18/self_attn/Constant_40_output_0'/blocks.18/self_attn/Reshape_3_output_0/blocks.18/self_attn/Reshape_3"Reshape* allowzero u '/blocks.18/self_attn/Reshape_3_output_0%/blocks.18/self_attn/Shape_8_output_0/blocks.18/self_attn/Shape_8"Shape  %/blocks.18/self_attn/Shape_8_output_0-/blocks.18/self_attn/ConstantOfShape_output_0$/blocks.18/self_attn/ConstantOfShape"ConstantOfShape*L value*@B0/blocks.18/self_attn/ConstantOfShape_attr::valueJ )/blocks.18/self_attn/Constant_41_output_0 /blocks.18/self_attn/Constant_41"Constant*F value*:B,/blocks.18/self_attn/Constant_41_attr::valueJ  -/blocks.18/self_attn/ConstantOfShape_output_0 )/blocks.18/self_attn/Constant_41_output_0#/blocks.18/self_attn/Mul_4_output_0/blocks.18/self_attn/Mul_4"Mul  '/blocks.18/self_attn/Reshape_3_output_0 #/blocks.18/self_attn/Mul_4_output_0#/blocks.18/self_attn/Equal_output_0/blocks.18/self_attn/Equal"Equal  #/blocks.18/self_attn/Equal_output_0 -/blocks.18/self_attn/ConstantOfShape_output_0 '/blocks.18/self_attn/Reshape_3_output_0#/blocks.18/self_attn/Where_output_0/blocks.18/self_attn/Where"Where  */blocks.18/self_attn/Unsqueeze_12_output_0 #/blocks.18/self_attn/Where_output_0$/blocks.18/self_attn/Expand_output_0/blocks.18/self_attn/Expand"Expand )/blocks.18/self_attn/Constant_42_output_0 /blocks.18/self_attn/Constant_42"Constant*F value*:B,/blocks.18/self_attn/Constant_42_attr::valueJ  &/blocks.18/self_attn/Gather_7_output_0 )/blocks.18/self_attn/Constant_42_output_0#/blocks.18/self_attn/Mul_5_output_0/blocks.18/self_attn/Mul_5"Mul fonnx::Unsqueeze_5769 Constant_7428"Constant*5 value*)BConstant_7428_attr::valueJ  &/blocks.18/self_attn/Gather_6_output_0 onnx::Unsqueeze_5769*/blocks.18/self_attn/Unsqueeze_17_output_0!/blocks.18/self_attn/Unsqueeze_17" Unsqueeze fonnx::Unsqueeze_5771 Constant_7430"Constant*5 value*)BConstant_7430_attr::valueJ  #/blocks.18/self_attn/Mul_5_output_0 onnx::Unsqueeze_5771*/blocks.18/self_attn/Unsqueeze_18_output_0!/blocks.18/self_attn/Unsqueeze_18" Unsqueeze fonnx::Unsqueeze_5773 Constant_7432"Constant*5 value*)BConstant_7432_attr::valueJ  &/blocks.18/self_attn/Gather_8_output_0 onnx::Unsqueeze_5773*/blocks.18/self_attn/Unsqueeze_19_output_0!/blocks.18/self_attn/Unsqueeze_19" Unsqueeze fonnx::Unsqueeze_5775 Constant_7434"Constant*5 value*)BConstant_7434_attr::valueJ  &/blocks.18/self_attn/Gather_9_output_0 onnx::Unsqueeze_5775*/blocks.18/self_attn/Unsqueeze_20_output_0!/blocks.18/self_attn/Unsqueeze_20" Unsqueeze  */blocks.18/self_attn/Unsqueeze_17_output_0 */blocks.18/self_attn/Unsqueeze_18_output_0 */blocks.18/self_attn/Unsqueeze_19_output_0 */blocks.18/self_attn/Unsqueeze_20_output_0&/blocks.18/self_attn/Concat_9_output_0/blocks.18/self_attn/Concat_9"Concat* axis  $/blocks.18/self_attn/Expand_output_0 &/blocks.18/self_attn/Concat_9_output_0'/blocks.18/self_attn/Reshape_4_output_0/blocks.18/self_attn/Reshape_4"Reshape* allowzero w )/blocks.18/self_attn/Transpose_2_output_0%/blocks.18/self_attn/Shape_9_output_0/blocks.18/self_attn/Shape_9"Shape )/blocks.18/self_attn/Constant_43_output_0 /blocks.18/self_attn/Constant_43"Constant*F value*:B,/blocks.18/self_attn/Constant_43_attr::valueJ  %/blocks.18/self_attn/Shape_9_output_0 )/blocks.18/self_attn/Constant_43_output_0'/blocks.18/self_attn/Gather_10_output_0/blocks.18/self_attn/Gather_10"Gather* axis y )/blocks.18/self_attn/Transpose_2_output_0&/blocks.18/self_attn/Shape_10_output_0/blocks.18/self_attn/Shape_10"Shape )/blocks.18/self_attn/Constant_44_output_0 /blocks.18/self_attn/Constant_44"Constant*F value*:B,/blocks.18/self_attn/Constant_44_attr::valueJ  &/blocks.18/self_attn/Shape_10_output_0 )/blocks.18/self_attn/Constant_44_output_0'/blocks.18/self_attn/Gather_11_output_0/blocks.18/self_attn/Gather_11"Gather* axis y )/blocks.18/self_attn/Transpose_2_output_0&/blocks.18/self_attn/Shape_11_output_0/blocks.18/self_attn/Shape_11"Shape )/blocks.18/self_attn/Constant_45_output_0 /blocks.18/self_attn/Constant_45"Constant*F value*:B,/blocks.18/self_attn/Constant_45_attr::valueJ  &/blocks.18/self_attn/Shape_11_output_0 )/blocks.18/self_attn/Constant_45_output_0'/blocks.18/self_attn/Gather_12_output_0/blocks.18/self_attn/Gather_12"Gather* axis y )/blocks.18/self_attn/Transpose_2_output_0&/blocks.18/self_attn/Shape_12_output_0/blocks.18/self_attn/Shape_12"Shape )/blocks.18/self_attn/Constant_46_output_0 /blocks.18/self_attn/Constant_46"Constant*F value*:B,/blocks.18/self_attn/Constant_46_attr::valueJ  &/blocks.18/self_attn/Shape_12_output_0 )/blocks.18/self_attn/Constant_46_output_0'/blocks.18/self_attn/Gather_13_output_0/blocks.18/self_attn/Gather_13"Gather* axis )/blocks.18/self_attn/Constant_47_output_0 /blocks.18/self_attn/Constant_47"Constant*H value*<B,/blocks.18/self_attn/Constant_47_attr::valueJ  )/blocks.18/self_attn/Transpose_2_output_0 )/blocks.18/self_attn/Constant_47_output_0*/blocks.18/self_attn/Unsqueeze_21_output_0!/blocks.18/self_attn/Unsqueeze_21" Unsqueeze )/blocks.18/self_attn/Constant_48_output_0 /blocks.18/self_attn/Constant_48"Constant*H value*<B,/blocks.18/self_attn/Constant_48_attr::valueJ  '/blocks.18/self_attn/Gather_10_output_0 )/blocks.18/self_attn/Constant_48_output_0*/blocks.18/self_attn/Unsqueeze_22_output_0!/blocks.18/self_attn/Unsqueeze_22" Unsqueeze )/blocks.18/self_attn/Constant_49_output_0 /blocks.18/self_attn/Constant_49"Constant*H value*<B,/blocks.18/self_attn/Constant_49_attr::valueJ  '/blocks.18/self_attn/Gather_11_output_0 )/blocks.18/self_attn/Constant_49_output_0*/blocks.18/self_attn/Unsqueeze_23_output_0!/blocks.18/self_attn/Unsqueeze_23" Unsqueeze )/blocks.18/self_attn/Constant_50_output_0 /blocks.18/self_attn/Constant_50"Constant*H value*<B,/blocks.18/self_attn/Constant_50_attr::valueJ )/blocks.18/self_attn/Constant_51_output_0 /blocks.18/self_attn/Constant_51"Constant*H value*<B,/blocks.18/self_attn/Constant_51_attr::valueJ  '/blocks.18/self_attn/Gather_12_output_0 )/blocks.18/self_attn/Constant_51_output_0*/blocks.18/self_attn/Unsqueeze_24_output_0!/blocks.18/self_attn/Unsqueeze_24" Unsqueeze )/blocks.18/self_attn/Constant_52_output_0 /blocks.18/self_attn/Constant_52"Constant*H value*<B,/blocks.18/self_attn/Constant_52_attr::valueJ  '/blocks.18/self_attn/Gather_13_output_0 )/blocks.18/self_attn/Constant_52_output_0*/blocks.18/self_attn/Unsqueeze_25_output_0!/blocks.18/self_attn/Unsqueeze_25" Unsqueeze  */blocks.18/self_attn/Unsqueeze_22_output_0 */blocks.18/self_attn/Unsqueeze_23_output_0 )/blocks.18/self_attn/Constant_50_output_0 */blocks.18/self_attn/Unsqueeze_24_output_0 */blocks.18/self_attn/Unsqueeze_25_output_0'/blocks.18/self_attn/Concat_10_output_0/blocks.18/self_attn/Concat_10"Concat* axis )/blocks.18/self_attn/Constant_53_output_0 /blocks.18/self_attn/Constant_53"Constant*H value*<B,/blocks.18/self_attn/Constant_53_attr::valueJ  '/blocks.18/self_attn/Concat_10_output_0 )/blocks.18/self_attn/Constant_53_output_0'/blocks.18/self_attn/Reshape_5_output_0/blocks.18/self_attn/Reshape_5"Reshape* allowzero w '/blocks.18/self_attn/Reshape_5_output_0&/blocks.18/self_attn/Shape_13_output_0/blocks.18/self_attn/Shape_13"Shape  &/blocks.18/self_attn/Shape_13_output_0//blocks.18/self_attn/ConstantOfShape_1_output_0&/blocks.18/self_attn/ConstantOfShape_1"ConstantOfShape*N value*BB2/blocks.18/self_attn/ConstantOfShape_1_attr::valueJ )/blocks.18/self_attn/Constant_54_output_0 /blocks.18/self_attn/Constant_54"Constant*F value*:B,/blocks.18/self_attn/Constant_54_attr::valueJ  //blocks.18/self_attn/ConstantOfShape_1_output_0 )/blocks.18/self_attn/Constant_54_output_0#/blocks.18/self_attn/Mul_6_output_0/blocks.18/self_attn/Mul_6"Mul  '/blocks.18/self_attn/Reshape_5_output_0 #/blocks.18/self_attn/Mul_6_output_0%/blocks.18/self_attn/Equal_1_output_0/blocks.18/self_attn/Equal_1"Equal  %/blocks.18/self_attn/Equal_1_output_0 //blocks.18/self_attn/ConstantOfShape_1_output_0 '/blocks.18/self_attn/Reshape_5_output_0%/blocks.18/self_attn/Where_1_output_0/blocks.18/self_attn/Where_1"Where  */blocks.18/self_attn/Unsqueeze_21_output_0 %/blocks.18/self_attn/Where_1_output_0&/blocks.18/self_attn/Expand_1_output_0/blocks.18/self_attn/Expand_1"Expand )/blocks.18/self_attn/Constant_55_output_0 /blocks.18/self_attn/Constant_55"Constant*F value*:B,/blocks.18/self_attn/Constant_55_attr::valueJ  '/blocks.18/self_attn/Gather_11_output_0 )/blocks.18/self_attn/Constant_55_output_0#/blocks.18/self_attn/Mul_7_output_0/blocks.18/self_attn/Mul_7"Mul fonnx::Unsqueeze_5815 Constant_7473"Constant*5 value*)BConstant_7473_attr::valueJ  '/blocks.18/self_attn/Gather_10_output_0 onnx::Unsqueeze_5815*/blocks.18/self_attn/Unsqueeze_26_output_0!/blocks.18/self_attn/Unsqueeze_26" Unsqueeze fonnx::Unsqueeze_5817 Constant_7475"Constant*5 value*)BConstant_7475_attr::valueJ  #/blocks.18/self_attn/Mul_7_output_0 onnx::Unsqueeze_5817*/blocks.18/self_attn/Unsqueeze_27_output_0!/blocks.18/self_attn/Unsqueeze_27" Unsqueeze fonnx::Unsqueeze_5819 Constant_7477"Constant*5 value*)BConstant_7477_attr::valueJ  '/blocks.18/self_attn/Gather_12_output_0 onnx::Unsqueeze_5819*/blocks.18/self_attn/Unsqueeze_28_output_0!/blocks.18/self_attn/Unsqueeze_28" Unsqueeze fonnx::Unsqueeze_5821 Constant_7479"Constant*5 value*)BConstant_7479_attr::valueJ  '/blocks.18/self_attn/Gather_13_output_0 onnx::Unsqueeze_5821*/blocks.18/self_attn/Unsqueeze_29_output_0!/blocks.18/self_attn/Unsqueeze_29" Unsqueeze  */blocks.18/self_attn/Unsqueeze_26_output_0 */blocks.18/self_attn/Unsqueeze_27_output_0 */blocks.18/self_attn/Unsqueeze_28_output_0 */blocks.18/self_attn/Unsqueeze_29_output_0'/blocks.18/self_attn/Concat_11_output_0/blocks.18/self_attn/Concat_11"Concat* axis  &/blocks.18/self_attn/Expand_1_output_0 '/blocks.18/self_attn/Concat_11_output_0'/blocks.18/self_attn/Reshape_6_output_0/blocks.18/self_attn/Reshape_6"Reshape* allowzero  '/blocks.18/self_attn/Transpose_output_0 '/blocks.18/self_attn/Reshape_4_output_0$/blocks.18/self_attn/MatMul_output_0/blocks.18/self_attn/MatMul"MatMul )/blocks.18/self_attn/Constant_56_output_0 /blocks.18/self_attn/Constant_56"Constant*B value*6B,/blocks.18/self_attn/Constant_56_attr::valueJ5A  $/blocks.18/self_attn/MatMul_output_0 )/blocks.18/self_attn/Constant_56_output_0#/blocks.18/self_attn/Div_2_output_0/blocks.18/self_attn/Div_2"Div { #/blocks.18/self_attn/Div_2_output_0 attention_mask#/blocks.18/self_attn/Add_2_output_0/blocks.18/self_attn/Add_2"Add  #/blocks.18/self_attn/Add_2_output_0%/blocks.18/self_attn/Softmax_output_0/blocks.18/self_attn/Softmax"Softmax* axis { %/blocks.18/self_attn/Softmax_output_0$/blocks.18/self_attn/Cast_4_output_0/blocks.18/self_attn/Cast_4"Cast* to  $/blocks.18/self_attn/Cast_4_output_0 '/blocks.18/self_attn/Reshape_6_output_0&/blocks.18/self_attn/MatMul_1_output_0/blocks.18/self_attn/MatMul_1"MatMul  &/blocks.18/self_attn/MatMul_1_output_0)/blocks.18/self_attn/Transpose_3_output_0 /blocks.18/self_attn/Transpose_3" Transpose* perm@@@@ fonnx::Unsqueeze_5833 Constant_7491"Constant*5 value*)BConstant_7491_attr::valueJ  $/blocks.18/self_attn/Gather_output_0 onnx::Unsqueeze_5833*/blocks.18/self_attn/Unsqueeze_30_output_0!/blocks.18/self_attn/Unsqueeze_30" Unsqueeze fonnx::Unsqueeze_5835 Constant_7493"Constant*5 value*)BConstant_7493_attr::valueJ  &/blocks.18/self_attn/Gather_1_output_0 onnx::Unsqueeze_5835*/blocks.18/self_attn/Unsqueeze_31_output_0!/blocks.18/self_attn/Unsqueeze_31" Unsqueeze )/blocks.18/self_attn/Constant_57_output_0 /blocks.18/self_attn/Constant_57"Constant*H value*<B,/blocks.18/self_attn/Constant_57_attr::valueJ  */blocks.18/self_attn/Unsqueeze_30_output_0 */blocks.18/self_attn/Unsqueeze_31_output_0 )/blocks.18/self_attn/Constant_57_output_0'/blocks.18/self_attn/Concat_12_output_0/blocks.18/self_attn/Concat_12"Concat* axis  )/blocks.18/self_attn/Transpose_3_output_0 '/blocks.18/self_attn/Concat_12_output_0'/blocks.18/self_attn/Reshape_7_output_0/blocks.18/self_attn/Reshape_7"Reshape* allowzero  '/blocks.18/self_attn/Reshape_7_output_0 onnx::MatMul_9093+/blocks.18/self_attn/o_proj/MatMul_output_0"/blocks.18/self_attn/o_proj/MatMul"MatMul  */blocks.18/input_layernorm/Cast_1_output_0 +/blocks.18/self_attn/o_proj/MatMul_output_0/blocks.18/Add_output_0/blocks.18/Add"Add  /blocks.18/Add_output_01/blocks.18/post_attention_layernorm/Cast_output_0(/blocks.18/post_attention_layernorm/Cast"Cast* to 5/blocks.18/post_attention_layernorm/Constant_output_0,/blocks.18/post_attention_layernorm/Constant"Constant*N value*BB8/blocks.18/post_attention_layernorm/Constant_attr::valueJ@  1/blocks.18/post_attention_layernorm/Cast_output_0 5/blocks.18/post_attention_layernorm/Constant_output_00/blocks.18/post_attention_layernorm/Pow_output_0'/blocks.18/post_attention_layernorm/Pow"Pow  0/blocks.18/post_attention_layernorm/Pow_output_07/blocks.18/post_attention_layernorm/ReduceMean_output_0./blocks.18/post_attention_layernorm/ReduceMean" ReduceMean* axes@* keepdims 7/blocks.18/post_attention_layernorm/Constant_1_output_0./blocks.18/post_attention_layernorm/Constant_1"Constant*P value*DB:/blocks.18/post_attention_layernorm/Constant_1_attr::valueJ75  7/blocks.18/post_attention_layernorm/ReduceMean_output_0 7/blocks.18/post_attention_layernorm/Constant_1_output_00/blocks.18/post_attention_layernorm/Add_output_0'/blocks.18/post_attention_layernorm/Add"Add  0/blocks.18/post_attention_layernorm/Add_output_01/blocks.18/post_attention_layernorm/Sqrt_output_0(/blocks.18/post_attention_layernorm/Sqrt"Sqrt 7/blocks.18/post_attention_layernorm/Constant_2_output_0./blocks.18/post_attention_layernorm/Constant_2"Constant*P value*DB:/blocks.18/post_attention_layernorm/Constant_2_attr::valueJ?  7/blocks.18/post_attention_layernorm/Constant_2_output_0 1/blocks.18/post_attention_layernorm/Sqrt_output_00/blocks.18/post_attention_layernorm/Div_output_0'/blocks.18/post_attention_layernorm/Div"Div  1/blocks.18/post_attention_layernorm/Cast_output_03/blocks.18/post_attention_layernorm/Cast_1_output_0*/blocks.18/post_attention_layernorm/Cast_1"Cast* to  3/blocks.18/post_attention_layernorm/Cast_1_output_0 0/blocks.18/post_attention_layernorm/Div_output_00/blocks.18/post_attention_layernorm/Mul_output_0'/blocks.18/post_attention_layernorm/Mul"Mul  0/blocks.18/post_attention_layernorm/Mul_output_0 )blocks.18.post_attention_layernorm.weight2/blocks.18/post_attention_layernorm/Mul_1_output_0)/blocks.18/post_attention_layernorm/Mul_1"Mul  2/blocks.18/post_attention_layernorm/Mul_1_output_03/blocks.18/post_attention_layernorm/Cast_2_output_0*/blocks.18/post_attention_layernorm/Cast_2"Cast* to  3/blocks.18/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_9094(/blocks.18/mlp/gate_proj/MatMul_output_0/blocks.18/mlp/gate_proj/MatMul"MatMul z (/blocks.18/mlp/gate_proj/MatMul_output_0&/blocks.18/mlp/act_fn/Sigmoid_output_0/blocks.18/mlp/act_fn/Sigmoid"Sigmoid  (/blocks.18/mlp/gate_proj/MatMul_output_0 &/blocks.18/mlp/act_fn/Sigmoid_output_0"/blocks.18/mlp/act_fn/Mul_output_0/blocks.18/mlp/act_fn/Mul"Mul  3/blocks.18/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_9095&/blocks.18/mlp/up_proj/MatMul_output_0/blocks.18/mlp/up_proj/MatMul"MatMul  "/blocks.18/mlp/act_fn/Mul_output_0 &/blocks.18/mlp/up_proj/MatMul_output_0/blocks.18/mlp/Mul_output_0/blocks.18/mlp/Mul"Mul  /blocks.18/mlp/Mul_output_0 onnx::MatMul_9096(/blocks.18/mlp/down_proj/MatMul_output_0/blocks.18/mlp/down_proj/MatMul"MatMul  3/blocks.18/post_attention_layernorm/Cast_1_output_0 (/blocks.18/mlp/down_proj/MatMul_output_0/blocks.18/Add_1_output_0/blocks.18/Add_1"Add c/Constant_11_output_0 /Constant_11"Constant*2 value*&B/Constant_11_attr::valueJ ^ past_key_values /Constant_11_output_0/Gather_19_output_0 /Gather_19"Gather* axis /blocks.19/Constant_output_0/blocks.19/Constant"Constant*K value*?B/blocks.19/Constant_attr::valueJ  /blocks.18/Add_1_output_0 /blocks.19/Constant_output_0/blocks.19/Reshape_output_0/blocks.19/Reshape"Reshape* allowzero y /blocks.19/Reshape_output_0(/blocks.19/input_layernorm/Cast_output_0/blocks.19/input_layernorm/Cast"Cast* to ,/blocks.19/input_layernorm/Constant_output_0#/blocks.19/input_layernorm/Constant"Constant*E value*9B//blocks.19/input_layernorm/Constant_attr::valueJ@  (/blocks.19/input_layernorm/Cast_output_0 ,/blocks.19/input_layernorm/Constant_output_0'/blocks.19/input_layernorm/Pow_output_0/blocks.19/input_layernorm/Pow"Pow  '/blocks.19/input_layernorm/Pow_output_0./blocks.19/input_layernorm/ReduceMean_output_0%/blocks.19/input_layernorm/ReduceMean" ReduceMean* axes@* keepdims ./blocks.19/input_layernorm/Constant_1_output_0%/blocks.19/input_layernorm/Constant_1"Constant*G value*;B1/blocks.19/input_layernorm/Constant_1_attr::valueJ75  ./blocks.19/input_layernorm/ReduceMean_output_0 ./blocks.19/input_layernorm/Constant_1_output_0'/blocks.19/input_layernorm/Add_output_0/blocks.19/input_layernorm/Add"Add z '/blocks.19/input_layernorm/Add_output_0(/blocks.19/input_layernorm/Sqrt_output_0/blocks.19/input_layernorm/Sqrt"Sqrt ./blocks.19/input_layernorm/Constant_2_output_0%/blocks.19/input_layernorm/Constant_2"Constant*G value*;B1/blocks.19/input_layernorm/Constant_2_attr::valueJ?  ./blocks.19/input_layernorm/Constant_2_output_0 (/blocks.19/input_layernorm/Sqrt_output_0'/blocks.19/input_layernorm/Div_output_0/blocks.19/input_layernorm/Div"Div  (/blocks.19/input_layernorm/Cast_output_0*/blocks.19/input_layernorm/Cast_1_output_0!/blocks.19/input_layernorm/Cast_1"Cast* to  */blocks.19/input_layernorm/Cast_1_output_0 '/blocks.19/input_layernorm/Div_output_0'/blocks.19/input_layernorm/Mul_output_0/blocks.19/input_layernorm/Mul"Mul  '/blocks.19/input_layernorm/Mul_output_0 blocks.19.input_layernorm.weight)/blocks.19/input_layernorm/Mul_1_output_0 /blocks.19/input_layernorm/Mul_1"Mul  )/blocks.19/input_layernorm/Mul_1_output_0*/blocks.19/input_layernorm/Cast_2_output_0!/blocks.19/input_layernorm/Cast_2"Cast* to t */blocks.19/input_layernorm/Cast_2_output_0#/blocks.19/self_attn/Shape_output_0/blocks.19/self_attn/Shape"Shape &/blocks.19/self_attn/Constant_output_0/blocks.19/self_attn/Constant"Constant*C value*7B)/blocks.19/self_attn/Constant_attr::valueJ  #/blocks.19/self_attn/Shape_output_0 &/blocks.19/self_attn/Constant_output_0$/blocks.19/self_attn/Gather_output_0/blocks.19/self_attn/Gather"Gather* axis x */blocks.19/input_layernorm/Cast_2_output_0%/blocks.19/self_attn/Shape_1_output_0/blocks.19/self_attn/Shape_1"Shape (/blocks.19/self_attn/Constant_1_output_0/blocks.19/self_attn/Constant_1"Constant*E value*9B+/blocks.19/self_attn/Constant_1_attr::valueJ  %/blocks.19/self_attn/Shape_1_output_0 (/blocks.19/self_attn/Constant_1_output_0&/blocks.19/self_attn/Gather_1_output_0/blocks.19/self_attn/Gather_1"Gather* axis  */blocks.19/input_layernorm/Cast_2_output_0 onnx::MatMul_9097+/blocks.19/self_attn/q_proj/MatMul_output_0"/blocks.19/self_attn/q_proj/MatMul"MatMul  */blocks.19/input_layernorm/Cast_2_output_0 onnx::MatMul_9098+/blocks.19/self_attn/k_proj/MatMul_output_0"/blocks.19/self_attn/k_proj/MatMul"MatMul  */blocks.19/input_layernorm/Cast_2_output_0 onnx::MatMul_9099+/blocks.19/self_attn/v_proj/MatMul_output_0"/blocks.19/self_attn/v_proj/MatMul"MatMul fonnx::Unsqueeze_5896 Constant_7546"Constant*5 value*)BConstant_7546_attr::valueJ  $/blocks.19/self_attn/Gather_output_0 onnx::Unsqueeze_5896'/blocks.19/self_attn/Unsqueeze_output_0/blocks.19/self_attn/Unsqueeze" Unsqueeze fonnx::Unsqueeze_5898 Constant_7548"Constant*5 value*)BConstant_7548_attr::valueJ  &/blocks.19/self_attn/Gather_1_output_0 onnx::Unsqueeze_5898)/blocks.19/self_attn/Unsqueeze_1_output_0 /blocks.19/self_attn/Unsqueeze_1" Unsqueeze (/blocks.19/self_attn/Constant_2_output_0/blocks.19/self_attn/Constant_2"Constant*G value*;B+/blocks.19/self_attn/Constant_2_attr::valueJ (/blocks.19/self_attn/Constant_3_output_0/blocks.19/self_attn/Constant_3"Constant*G value*;B+/blocks.19/self_attn/Constant_3_attr::valueJ  '/blocks.19/self_attn/Unsqueeze_output_0 )/blocks.19/self_attn/Unsqueeze_1_output_0 (/blocks.19/self_attn/Constant_2_output_0 (/blocks.19/self_attn/Constant_3_output_0$/blocks.19/self_attn/Concat_output_0/blocks.19/self_attn/Concat"Concat* axis  +/blocks.19/self_attn/q_proj/MatMul_output_0 $/blocks.19/self_attn/Concat_output_0%/blocks.19/self_attn/Reshape_output_0/blocks.19/self_attn/Reshape"Reshape* allowzero fonnx::Unsqueeze_5906 Constant_7554"Constant*5 value*)BConstant_7554_attr::valueJ  $/blocks.19/self_attn/Gather_output_0 onnx::Unsqueeze_5906)/blocks.19/self_attn/Unsqueeze_2_output_0 /blocks.19/self_attn/Unsqueeze_2" Unsqueeze fonnx::Unsqueeze_5908 Constant_7556"Constant*5 value*)BConstant_7556_attr::valueJ  &/blocks.19/self_attn/Gather_1_output_0 onnx::Unsqueeze_5908)/blocks.19/self_attn/Unsqueeze_3_output_0 /blocks.19/self_attn/Unsqueeze_3" Unsqueeze (/blocks.19/self_attn/Constant_4_output_0/blocks.19/self_attn/Constant_4"Constant*G value*;B+/blocks.19/self_attn/Constant_4_attr::valueJ (/blocks.19/self_attn/Constant_5_output_0/blocks.19/self_attn/Constant_5"Constant*G value*;B+/blocks.19/self_attn/Constant_5_attr::valueJ  )/blocks.19/self_attn/Unsqueeze_2_output_0 )/blocks.19/self_attn/Unsqueeze_3_output_0 (/blocks.19/self_attn/Constant_4_output_0 (/blocks.19/self_attn/Constant_5_output_0&/blocks.19/self_attn/Concat_1_output_0/blocks.19/self_attn/Concat_1"Concat* axis fonnx::Unsqueeze_5915 Constant_7561"Constant*5 value*)BConstant_7561_attr::valueJ  $/blocks.19/self_attn/Gather_output_0 onnx::Unsqueeze_5915)/blocks.19/self_attn/Unsqueeze_4_output_0 /blocks.19/self_attn/Unsqueeze_4" Unsqueeze fonnx::Unsqueeze_5917 Constant_7563"Constant*5 value*)BConstant_7563_attr::valueJ  &/blocks.19/self_attn/Gather_1_output_0 onnx::Unsqueeze_5917)/blocks.19/self_attn/Unsqueeze_5_output_0 /blocks.19/self_attn/Unsqueeze_5" Unsqueeze (/blocks.19/self_attn/Constant_6_output_0/blocks.19/self_attn/Constant_6"Constant*G value*;B+/blocks.19/self_attn/Constant_6_attr::valueJ (/blocks.19/self_attn/Constant_7_output_0/blocks.19/self_attn/Constant_7"Constant*G value*;B+/blocks.19/self_attn/Constant_7_attr::valueJ  )/blocks.19/self_attn/Unsqueeze_4_output_0 )/blocks.19/self_attn/Unsqueeze_5_output_0 (/blocks.19/self_attn/Constant_6_output_0 (/blocks.19/self_attn/Constant_7_output_0&/blocks.19/self_attn/Concat_2_output_0/blocks.19/self_attn/Concat_2"Concat* axis  +/blocks.19/self_attn/k_proj/MatMul_output_0 &/blocks.19/self_attn/Concat_1_output_0'/blocks.19/self_attn/Reshape_1_output_0/blocks.19/self_attn/Reshape_1"Reshape* allowzero  +/blocks.19/self_attn/v_proj/MatMul_output_0 &/blocks.19/self_attn/Concat_2_output_0'/blocks.19/self_attn/Reshape_2_output_0/blocks.19/self_attn/Reshape_2"Reshape* allowzero  %/blocks.19/self_attn/Reshape_output_0)/blocks.19/self_attn/q_norm/Cast_output_0 /blocks.19/self_attn/q_norm/Cast"Cast* to -/blocks.19/self_attn/q_norm/Constant_output_0$/blocks.19/self_attn/q_norm/Constant"Constant*F value*:B0/blocks.19/self_attn/q_norm/Constant_attr::valueJ@  )/blocks.19/self_attn/q_norm/Cast_output_0 -/blocks.19/self_attn/q_norm/Constant_output_0(/blocks.19/self_attn/q_norm/Pow_output_0/blocks.19/self_attn/q_norm/Pow"Pow  (/blocks.19/self_attn/q_norm/Pow_output_0//blocks.19/self_attn/q_norm/ReduceMean_output_0&/blocks.19/self_attn/q_norm/ReduceMean" ReduceMean* axes@* keepdims //blocks.19/self_attn/q_norm/Constant_1_output_0&/blocks.19/self_attn/q_norm/Constant_1"Constant*H value*<B2/blocks.19/self_attn/q_norm/Constant_1_attr::valueJ75  //blocks.19/self_attn/q_norm/ReduceMean_output_0 //blocks.19/self_attn/q_norm/Constant_1_output_0(/blocks.19/self_attn/q_norm/Add_output_0/blocks.19/self_attn/q_norm/Add"Add } (/blocks.19/self_attn/q_norm/Add_output_0)/blocks.19/self_attn/q_norm/Sqrt_output_0 /blocks.19/self_attn/q_norm/Sqrt"Sqrt //blocks.19/self_attn/q_norm/Constant_2_output_0&/blocks.19/self_attn/q_norm/Constant_2"Constant*H value*<B2/blocks.19/self_attn/q_norm/Constant_2_attr::valueJ?  //blocks.19/self_attn/q_norm/Constant_2_output_0 )/blocks.19/self_attn/q_norm/Sqrt_output_0(/blocks.19/self_attn/q_norm/Div_output_0/blocks.19/self_attn/q_norm/Div"Div  )/blocks.19/self_attn/q_norm/Cast_output_0+/blocks.19/self_attn/q_norm/Cast_1_output_0"/blocks.19/self_attn/q_norm/Cast_1"Cast* to  +/blocks.19/self_attn/q_norm/Cast_1_output_0 (/blocks.19/self_attn/q_norm/Div_output_0(/blocks.19/self_attn/q_norm/Mul_output_0/blocks.19/self_attn/q_norm/Mul"Mul  (/blocks.19/self_attn/q_norm/Mul_output_0 !blocks.19.self_attn.q_norm.weight*/blocks.19/self_attn/q_norm/Mul_1_output_0!/blocks.19/self_attn/q_norm/Mul_1"Mul  */blocks.19/self_attn/q_norm/Mul_1_output_0+/blocks.19/self_attn/q_norm/Cast_2_output_0"/blocks.19/self_attn/q_norm/Cast_2"Cast* to  '/blocks.19/self_attn/Reshape_1_output_0)/blocks.19/self_attn/k_norm/Cast_output_0 /blocks.19/self_attn/k_norm/Cast"Cast* to -/blocks.19/self_attn/k_norm/Constant_output_0$/blocks.19/self_attn/k_norm/Constant"Constant*F value*:B0/blocks.19/self_attn/k_norm/Constant_attr::valueJ@  )/blocks.19/self_attn/k_norm/Cast_output_0 -/blocks.19/self_attn/k_norm/Constant_output_0(/blocks.19/self_attn/k_norm/Pow_output_0/blocks.19/self_attn/k_norm/Pow"Pow  (/blocks.19/self_attn/k_norm/Pow_output_0//blocks.19/self_attn/k_norm/ReduceMean_output_0&/blocks.19/self_attn/k_norm/ReduceMean" ReduceMean* axes@* keepdims //blocks.19/self_attn/k_norm/Constant_1_output_0&/blocks.19/self_attn/k_norm/Constant_1"Constant*H value*<B2/blocks.19/self_attn/k_norm/Constant_1_attr::valueJ75  //blocks.19/self_attn/k_norm/ReduceMean_output_0 //blocks.19/self_attn/k_norm/Constant_1_output_0(/blocks.19/self_attn/k_norm/Add_output_0/blocks.19/self_attn/k_norm/Add"Add } (/blocks.19/self_attn/k_norm/Add_output_0)/blocks.19/self_attn/k_norm/Sqrt_output_0 /blocks.19/self_attn/k_norm/Sqrt"Sqrt //blocks.19/self_attn/k_norm/Constant_2_output_0&/blocks.19/self_attn/k_norm/Constant_2"Constant*H value*<B2/blocks.19/self_attn/k_norm/Constant_2_attr::valueJ?  //blocks.19/self_attn/k_norm/Constant_2_output_0 )/blocks.19/self_attn/k_norm/Sqrt_output_0(/blocks.19/self_attn/k_norm/Div_output_0/blocks.19/self_attn/k_norm/Div"Div  )/blocks.19/self_attn/k_norm/Cast_output_0+/blocks.19/self_attn/k_norm/Cast_1_output_0"/blocks.19/self_attn/k_norm/Cast_1"Cast* to  +/blocks.19/self_attn/k_norm/Cast_1_output_0 (/blocks.19/self_attn/k_norm/Div_output_0(/blocks.19/self_attn/k_norm/Mul_output_0/blocks.19/self_attn/k_norm/Mul"Mul  (/blocks.19/self_attn/k_norm/Mul_output_0 !blocks.19.self_attn.k_norm.weight*/blocks.19/self_attn/k_norm/Mul_1_output_0!/blocks.19/self_attn/k_norm/Mul_1"Mul  */blocks.19/self_attn/k_norm/Mul_1_output_0+/blocks.19/self_attn/k_norm/Cast_2_output_0"/blocks.19/self_attn/k_norm/Cast_2"Cast* to  +/blocks.19/self_attn/q_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0!/blocks.19/self_attn/Mul_output_0/blocks.19/self_attn/Mul"Mul y +/blocks.19/self_attn/q_norm/Cast_2_output_0%/blocks.19/self_attn/Shape_2_output_0/blocks.19/self_attn/Shape_2"Shape (/blocks.19/self_attn/Constant_8_output_0/blocks.19/self_attn/Constant_8"Constant*E value*9B+/blocks.19/self_attn/Constant_8_attr::valueJ  %/blocks.19/self_attn/Shape_2_output_0 (/blocks.19/self_attn/Constant_8_output_0&/blocks.19/self_attn/Gather_2_output_0/blocks.19/self_attn/Gather_2"Gather* axis (/blocks.19/self_attn/Constant_9_output_0/blocks.19/self_attn/Constant_9"Constant*E value*9B+/blocks.19/self_attn/Constant_9_attr::valueJ  &/blocks.19/self_attn/Gather_2_output_0 (/blocks.19/self_attn/Constant_9_output_0!/blocks.19/self_attn/Div_output_0/blocks.19/self_attn/Div"Div s !/blocks.19/self_attn/Div_output_0"/blocks.19/self_attn/Cast_output_0/blocks.19/self_attn/Cast"Cast* to x "/blocks.19/self_attn/Cast_output_0$/blocks.19/self_attn/Cast_1_output_0/blocks.19/self_attn/Cast_1"Cast* to )/blocks.19/self_attn/Constant_10_output_0 /blocks.19/self_attn/Constant_10"Constant*H value*<B,/blocks.19/self_attn/Constant_10_attr::valueJ )/blocks.19/self_attn/Constant_11_output_0 /blocks.19/self_attn/Constant_11"Constant*H value*<B,/blocks.19/self_attn/Constant_11_attr::valueJ )/blocks.19/self_attn/Constant_12_output_0 /blocks.19/self_attn/Constant_12"Constant*H value*<B,/blocks.19/self_attn/Constant_12_attr::valueJ  $/blocks.19/self_attn/Cast_1_output_0 )/blocks.19/self_attn/Constant_12_output_0)/blocks.19/self_attn/Unsqueeze_6_output_0 /blocks.19/self_attn/Unsqueeze_6" Unsqueeze )/blocks.19/self_attn/Constant_13_output_0 /blocks.19/self_attn/Constant_13"Constant*H value*<B,/blocks.19/self_attn/Constant_13_attr::valueJ  +/blocks.19/self_attn/q_norm/Cast_2_output_0 )/blocks.19/self_attn/Constant_11_output_0 )/blocks.19/self_attn/Unsqueeze_6_output_0 )/blocks.19/self_attn/Constant_10_output_0 )/blocks.19/self_attn/Constant_13_output_0#/blocks.19/self_attn/Slice_output_0/blocks.19/self_attn/Slice"Slice )/blocks.19/self_attn/Constant_14_output_0 /blocks.19/self_attn/Constant_14"Constant*H value*<B,/blocks.19/self_attn/Constant_14_attr::valueJ )/blocks.19/self_attn/Constant_15_output_0 /blocks.19/self_attn/Constant_15"Constant*H value*<B,/blocks.19/self_attn/Constant_15_attr::valueJ  $/blocks.19/self_attn/Cast_1_output_0 )/blocks.19/self_attn/Constant_15_output_0)/blocks.19/self_attn/Unsqueeze_7_output_0 /blocks.19/self_attn/Unsqueeze_7" Unsqueeze )/blocks.19/self_attn/Constant_16_output_0 /blocks.19/self_attn/Constant_16"Constant*H value*<B,/blocks.19/self_attn/Constant_16_attr::valueJ )/blocks.19/self_attn/Constant_17_output_0 /blocks.19/self_attn/Constant_17"Constant*H value*<B,/blocks.19/self_attn/Constant_17_attr::valueJ  +/blocks.19/self_attn/q_norm/Cast_2_output_0 )/blocks.19/self_attn/Unsqueeze_7_output_0 )/blocks.19/self_attn/Constant_16_output_0 )/blocks.19/self_attn/Constant_14_output_0 )/blocks.19/self_attn/Constant_17_output_0%/blocks.19/self_attn/Slice_1_output_0/blocks.19/self_attn/Slice_1"Slice i %/blocks.19/self_attn/Slice_1_output_0!/blocks.19/self_attn/Neg_output_0/blocks.19/self_attn/Neg"Neg  !/blocks.19/self_attn/Neg_output_0 #/blocks.19/self_attn/Slice_output_0&/blocks.19/self_attn/Concat_3_output_0/blocks.19/self_attn/Concat_3"Concat* axis  &/blocks.19/self_attn/Concat_3_output_0 %/blocks.0/self_attn/Gather_3_output_0#/blocks.19/self_attn/Mul_1_output_0/blocks.19/self_attn/Mul_1"Mul  !/blocks.19/self_attn/Mul_output_0 #/blocks.19/self_attn/Mul_1_output_0!/blocks.19/self_attn/Add_output_0/blocks.19/self_attn/Add"Add  +/blocks.19/self_attn/k_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0#/blocks.19/self_attn/Mul_2_output_0/blocks.19/self_attn/Mul_2"Mul y +/blocks.19/self_attn/k_norm/Cast_2_output_0%/blocks.19/self_attn/Shape_3_output_0/blocks.19/self_attn/Shape_3"Shape )/blocks.19/self_attn/Constant_18_output_0 /blocks.19/self_attn/Constant_18"Constant*F value*:B,/blocks.19/self_attn/Constant_18_attr::valueJ  %/blocks.19/self_attn/Shape_3_output_0 )/blocks.19/self_attn/Constant_18_output_0&/blocks.19/self_attn/Gather_3_output_0/blocks.19/self_attn/Gather_3"Gather* axis )/blocks.19/self_attn/Constant_19_output_0 /blocks.19/self_attn/Constant_19"Constant*F value*:B,/blocks.19/self_attn/Constant_19_attr::valueJ  &/blocks.19/self_attn/Gather_3_output_0 )/blocks.19/self_attn/Constant_19_output_0#/blocks.19/self_attn/Div_1_output_0/blocks.19/self_attn/Div_1"Div y #/blocks.19/self_attn/Div_1_output_0$/blocks.19/self_attn/Cast_2_output_0/blocks.19/self_attn/Cast_2"Cast* to z $/blocks.19/self_attn/Cast_2_output_0$/blocks.19/self_attn/Cast_3_output_0/blocks.19/self_attn/Cast_3"Cast* to )/blocks.19/self_attn/Constant_20_output_0 /blocks.19/self_attn/Constant_20"Constant*H value*<B,/blocks.19/self_attn/Constant_20_attr::valueJ )/blocks.19/self_attn/Constant_21_output_0 /blocks.19/self_attn/Constant_21"Constant*H value*<B,/blocks.19/self_attn/Constant_21_attr::valueJ )/blocks.19/self_attn/Constant_22_output_0 /blocks.19/self_attn/Constant_22"Constant*H value*<B,/blocks.19/self_attn/Constant_22_attr::valueJ  $/blocks.19/self_attn/Cast_3_output_0 )/blocks.19/self_attn/Constant_22_output_0)/blocks.19/self_attn/Unsqueeze_8_output_0 /blocks.19/self_attn/Unsqueeze_8" Unsqueeze )/blocks.19/self_attn/Constant_23_output_0 /blocks.19/self_attn/Constant_23"Constant*H value*<B,/blocks.19/self_attn/Constant_23_attr::valueJ  +/blocks.19/self_attn/k_norm/Cast_2_output_0 )/blocks.19/self_attn/Constant_21_output_0 )/blocks.19/self_attn/Unsqueeze_8_output_0 )/blocks.19/self_attn/Constant_20_output_0 )/blocks.19/self_attn/Constant_23_output_0%/blocks.19/self_attn/Slice_2_output_0/blocks.19/self_attn/Slice_2"Slice )/blocks.19/self_attn/Constant_24_output_0 /blocks.19/self_attn/Constant_24"Constant*H value*<B,/blocks.19/self_attn/Constant_24_attr::valueJ )/blocks.19/self_attn/Constant_25_output_0 /blocks.19/self_attn/Constant_25"Constant*H value*<B,/blocks.19/self_attn/Constant_25_attr::valueJ  $/blocks.19/self_attn/Cast_3_output_0 )/blocks.19/self_attn/Constant_25_output_0)/blocks.19/self_attn/Unsqueeze_9_output_0 /blocks.19/self_attn/Unsqueeze_9" Unsqueeze )/blocks.19/self_attn/Constant_26_output_0 /blocks.19/self_attn/Constant_26"Constant*H value*<B,/blocks.19/self_attn/Constant_26_attr::valueJ )/blocks.19/self_attn/Constant_27_output_0 /blocks.19/self_attn/Constant_27"Constant*H value*<B,/blocks.19/self_attn/Constant_27_attr::valueJ  +/blocks.19/self_attn/k_norm/Cast_2_output_0 )/blocks.19/self_attn/Unsqueeze_9_output_0 )/blocks.19/self_attn/Constant_26_output_0 )/blocks.19/self_attn/Constant_24_output_0 )/blocks.19/self_attn/Constant_27_output_0%/blocks.19/self_attn/Slice_3_output_0/blocks.19/self_attn/Slice_3"Slice m %/blocks.19/self_attn/Slice_3_output_0#/blocks.19/self_attn/Neg_1_output_0/blocks.19/self_attn/Neg_1"Neg  #/blocks.19/self_attn/Neg_1_output_0 %/blocks.19/self_attn/Slice_2_output_0&/blocks.19/self_attn/Concat_4_output_0/blocks.19/self_attn/Concat_4"Concat* axis  &/blocks.19/self_attn/Concat_4_output_0 %/blocks.0/self_attn/Gather_3_output_0#/blocks.19/self_attn/Mul_3_output_0/blocks.19/self_attn/Mul_3"Mul  #/blocks.19/self_attn/Mul_2_output_0 #/blocks.19/self_attn/Mul_3_output_0#/blocks.19/self_attn/Add_1_output_0/blocks.19/self_attn/Add_1"Add  /Gather_19_output_0 /rotary/Constant_3_output_0&/blocks.19/self_attn/Gather_4_output_0/blocks.19/self_attn/Gather_4"Gather* axis  /Gather_19_output_0 /rotary/Constant_8_output_0&/blocks.19/self_attn/Gather_5_output_0/blocks.19/self_attn/Gather_5"Gather* axis  &/blocks.19/self_attn/Gather_4_output_0 #/blocks.19/self_attn/Add_1_output_0&/blocks.19/self_attn/Concat_5_output_0/blocks.19/self_attn/Concat_5"Concat* axis  &/blocks.19/self_attn/Gather_5_output_0 '/blocks.19/self_attn/Reshape_2_output_0&/blocks.19/self_attn/Concat_6_output_0/blocks.19/self_attn/Concat_6"Concat* axis )/blocks.19/self_attn/Constant_28_output_0 /blocks.19/self_attn/Constant_28"Constant*H value*<B,/blocks.19/self_attn/Constant_28_attr::valueJ  &/blocks.19/self_attn/Concat_5_output_0 )/blocks.19/self_attn/Constant_28_output_0*/blocks.19/self_attn/Unsqueeze_10_output_0!/blocks.19/self_attn/Unsqueeze_10" Unsqueeze )/blocks.19/self_attn/Constant_29_output_0 /blocks.19/self_attn/Constant_29"Constant*H value*<B,/blocks.19/self_attn/Constant_29_attr::valueJ  &/blocks.19/self_attn/Concat_6_output_0 )/blocks.19/self_attn/Constant_29_output_0*/blocks.19/self_attn/Unsqueeze_11_output_0!/blocks.19/self_attn/Unsqueeze_11" Unsqueeze  */blocks.19/self_attn/Unsqueeze_10_output_0 */blocks.19/self_attn/Unsqueeze_11_output_0&/blocks.19/self_attn/Concat_7_output_0/blocks.19/self_attn/Concat_7"Concat* axis  !/blocks.19/self_attn/Add_output_0'/blocks.19/self_attn/Transpose_output_0/blocks.19/self_attn/Transpose" Transpose* perm@@@@  &/blocks.19/self_attn/Concat_5_output_0)/blocks.19/self_attn/Transpose_1_output_0 /blocks.19/self_attn/Transpose_1" Transpose* perm@@@@  &/blocks.19/self_attn/Concat_6_output_0)/blocks.19/self_attn/Transpose_2_output_0 /blocks.19/self_attn/Transpose_2" Transpose* perm@@@@ w )/blocks.19/self_attn/Transpose_1_output_0%/blocks.19/self_attn/Shape_4_output_0/blocks.19/self_attn/Shape_4"Shape )/blocks.19/self_attn/Constant_30_output_0 /blocks.19/self_attn/Constant_30"Constant*F value*:B,/blocks.19/self_attn/Constant_30_attr::valueJ  %/blocks.19/self_attn/Shape_4_output_0 )/blocks.19/self_attn/Constant_30_output_0&/blocks.19/self_attn/Gather_6_output_0/blocks.19/self_attn/Gather_6"Gather* axis w )/blocks.19/self_attn/Transpose_1_output_0%/blocks.19/self_attn/Shape_5_output_0/blocks.19/self_attn/Shape_5"Shape )/blocks.19/self_attn/Constant_31_output_0 /blocks.19/self_attn/Constant_31"Constant*F value*:B,/blocks.19/self_attn/Constant_31_attr::valueJ  %/blocks.19/self_attn/Shape_5_output_0 )/blocks.19/self_attn/Constant_31_output_0&/blocks.19/self_attn/Gather_7_output_0/blocks.19/self_attn/Gather_7"Gather* axis w )/blocks.19/self_attn/Transpose_1_output_0%/blocks.19/self_attn/Shape_6_output_0/blocks.19/self_attn/Shape_6"Shape )/blocks.19/self_attn/Constant_32_output_0 /blocks.19/self_attn/Constant_32"Constant*F value*:B,/blocks.19/self_attn/Constant_32_attr::valueJ  %/blocks.19/self_attn/Shape_6_output_0 )/blocks.19/self_attn/Constant_32_output_0&/blocks.19/self_attn/Gather_8_output_0/blocks.19/self_attn/Gather_8"Gather* axis w )/blocks.19/self_attn/Transpose_1_output_0%/blocks.19/self_attn/Shape_7_output_0/blocks.19/self_attn/Shape_7"Shape )/blocks.19/self_attn/Constant_33_output_0 /blocks.19/self_attn/Constant_33"Constant*F value*:B,/blocks.19/self_attn/Constant_33_attr::valueJ  %/blocks.19/self_attn/Shape_7_output_0 )/blocks.19/self_attn/Constant_33_output_0&/blocks.19/self_attn/Gather_9_output_0/blocks.19/self_attn/Gather_9"Gather* axis )/blocks.19/self_attn/Constant_34_output_0 /blocks.19/self_attn/Constant_34"Constant*H value*<B,/blocks.19/self_attn/Constant_34_attr::valueJ  )/blocks.19/self_attn/Transpose_1_output_0 )/blocks.19/self_attn/Constant_34_output_0*/blocks.19/self_attn/Unsqueeze_12_output_0!/blocks.19/self_attn/Unsqueeze_12" Unsqueeze )/blocks.19/self_attn/Constant_35_output_0 /blocks.19/self_attn/Constant_35"Constant*H value*<B,/blocks.19/self_attn/Constant_35_attr::valueJ  &/blocks.19/self_attn/Gather_6_output_0 )/blocks.19/self_attn/Constant_35_output_0*/blocks.19/self_attn/Unsqueeze_13_output_0!/blocks.19/self_attn/Unsqueeze_13" Unsqueeze )/blocks.19/self_attn/Constant_36_output_0 /blocks.19/self_attn/Constant_36"Constant*H value*<B,/blocks.19/self_attn/Constant_36_attr::valueJ  &/blocks.19/self_attn/Gather_7_output_0 )/blocks.19/self_attn/Constant_36_output_0*/blocks.19/self_attn/Unsqueeze_14_output_0!/blocks.19/self_attn/Unsqueeze_14" Unsqueeze )/blocks.19/self_attn/Constant_37_output_0 /blocks.19/self_attn/Constant_37"Constant*H value*<B,/blocks.19/self_attn/Constant_37_attr::valueJ )/blocks.19/self_attn/Constant_38_output_0 /blocks.19/self_attn/Constant_38"Constant*H value*<B,/blocks.19/self_attn/Constant_38_attr::valueJ  &/blocks.19/self_attn/Gather_8_output_0 )/blocks.19/self_attn/Constant_38_output_0*/blocks.19/self_attn/Unsqueeze_15_output_0!/blocks.19/self_attn/Unsqueeze_15" Unsqueeze )/blocks.19/self_attn/Constant_39_output_0 /blocks.19/self_attn/Constant_39"Constant*H value*<B,/blocks.19/self_attn/Constant_39_attr::valueJ  &/blocks.19/self_attn/Gather_9_output_0 )/blocks.19/self_attn/Constant_39_output_0*/blocks.19/self_attn/Unsqueeze_16_output_0!/blocks.19/self_attn/Unsqueeze_16" Unsqueeze  */blocks.19/self_attn/Unsqueeze_13_output_0 */blocks.19/self_attn/Unsqueeze_14_output_0 )/blocks.19/self_attn/Constant_37_output_0 */blocks.19/self_attn/Unsqueeze_15_output_0 */blocks.19/self_attn/Unsqueeze_16_output_0&/blocks.19/self_attn/Concat_8_output_0/blocks.19/self_attn/Concat_8"Concat* axis )/blocks.19/self_attn/Constant_40_output_0 /blocks.19/self_attn/Constant_40"Constant*H value*<B,/blocks.19/self_attn/Constant_40_attr::valueJ  &/blocks.19/self_attn/Concat_8_output_0 )/blocks.19/self_attn/Constant_40_output_0'/blocks.19/self_attn/Reshape_3_output_0/blocks.19/self_attn/Reshape_3"Reshape* allowzero u '/blocks.19/self_attn/Reshape_3_output_0%/blocks.19/self_attn/Shape_8_output_0/blocks.19/self_attn/Shape_8"Shape  %/blocks.19/self_attn/Shape_8_output_0-/blocks.19/self_attn/ConstantOfShape_output_0$/blocks.19/self_attn/ConstantOfShape"ConstantOfShape*L value*@B0/blocks.19/self_attn/ConstantOfShape_attr::valueJ )/blocks.19/self_attn/Constant_41_output_0 /blocks.19/self_attn/Constant_41"Constant*F value*:B,/blocks.19/self_attn/Constant_41_attr::valueJ  -/blocks.19/self_attn/ConstantOfShape_output_0 )/blocks.19/self_attn/Constant_41_output_0#/blocks.19/self_attn/Mul_4_output_0/blocks.19/self_attn/Mul_4"Mul  '/blocks.19/self_attn/Reshape_3_output_0 #/blocks.19/self_attn/Mul_4_output_0#/blocks.19/self_attn/Equal_output_0/blocks.19/self_attn/Equal"Equal  #/blocks.19/self_attn/Equal_output_0 -/blocks.19/self_attn/ConstantOfShape_output_0 '/blocks.19/self_attn/Reshape_3_output_0#/blocks.19/self_attn/Where_output_0/blocks.19/self_attn/Where"Where  */blocks.19/self_attn/Unsqueeze_12_output_0 #/blocks.19/self_attn/Where_output_0$/blocks.19/self_attn/Expand_output_0/blocks.19/self_attn/Expand"Expand )/blocks.19/self_attn/Constant_42_output_0 /blocks.19/self_attn/Constant_42"Constant*F value*:B,/blocks.19/self_attn/Constant_42_attr::valueJ  &/blocks.19/self_attn/Gather_7_output_0 )/blocks.19/self_attn/Constant_42_output_0#/blocks.19/self_attn/Mul_5_output_0/blocks.19/self_attn/Mul_5"Mul fonnx::Unsqueeze_6060 Constant_7691"Constant*5 value*)BConstant_7691_attr::valueJ  &/blocks.19/self_attn/Gather_6_output_0 onnx::Unsqueeze_6060*/blocks.19/self_attn/Unsqueeze_17_output_0!/blocks.19/self_attn/Unsqueeze_17" Unsqueeze fonnx::Unsqueeze_6062 Constant_7693"Constant*5 value*)BConstant_7693_attr::valueJ  #/blocks.19/self_attn/Mul_5_output_0 onnx::Unsqueeze_6062*/blocks.19/self_attn/Unsqueeze_18_output_0!/blocks.19/self_attn/Unsqueeze_18" Unsqueeze fonnx::Unsqueeze_6064 Constant_7695"Constant*5 value*)BConstant_7695_attr::valueJ  &/blocks.19/self_attn/Gather_8_output_0 onnx::Unsqueeze_6064*/blocks.19/self_attn/Unsqueeze_19_output_0!/blocks.19/self_attn/Unsqueeze_19" Unsqueeze fonnx::Unsqueeze_6066 Constant_7697"Constant*5 value*)BConstant_7697_attr::valueJ  &/blocks.19/self_attn/Gather_9_output_0 onnx::Unsqueeze_6066*/blocks.19/self_attn/Unsqueeze_20_output_0!/blocks.19/self_attn/Unsqueeze_20" Unsqueeze  */blocks.19/self_attn/Unsqueeze_17_output_0 */blocks.19/self_attn/Unsqueeze_18_output_0 */blocks.19/self_attn/Unsqueeze_19_output_0 */blocks.19/self_attn/Unsqueeze_20_output_0&/blocks.19/self_attn/Concat_9_output_0/blocks.19/self_attn/Concat_9"Concat* axis  $/blocks.19/self_attn/Expand_output_0 &/blocks.19/self_attn/Concat_9_output_0'/blocks.19/self_attn/Reshape_4_output_0/blocks.19/self_attn/Reshape_4"Reshape* allowzero w )/blocks.19/self_attn/Transpose_2_output_0%/blocks.19/self_attn/Shape_9_output_0/blocks.19/self_attn/Shape_9"Shape )/blocks.19/self_attn/Constant_43_output_0 /blocks.19/self_attn/Constant_43"Constant*F value*:B,/blocks.19/self_attn/Constant_43_attr::valueJ  %/blocks.19/self_attn/Shape_9_output_0 )/blocks.19/self_attn/Constant_43_output_0'/blocks.19/self_attn/Gather_10_output_0/blocks.19/self_attn/Gather_10"Gather* axis y )/blocks.19/self_attn/Transpose_2_output_0&/blocks.19/self_attn/Shape_10_output_0/blocks.19/self_attn/Shape_10"Shape )/blocks.19/self_attn/Constant_44_output_0 /blocks.19/self_attn/Constant_44"Constant*F value*:B,/blocks.19/self_attn/Constant_44_attr::valueJ  &/blocks.19/self_attn/Shape_10_output_0 )/blocks.19/self_attn/Constant_44_output_0'/blocks.19/self_attn/Gather_11_output_0/blocks.19/self_attn/Gather_11"Gather* axis y )/blocks.19/self_attn/Transpose_2_output_0&/blocks.19/self_attn/Shape_11_output_0/blocks.19/self_attn/Shape_11"Shape )/blocks.19/self_attn/Constant_45_output_0 /blocks.19/self_attn/Constant_45"Constant*F value*:B,/blocks.19/self_attn/Constant_45_attr::valueJ  &/blocks.19/self_attn/Shape_11_output_0 )/blocks.19/self_attn/Constant_45_output_0'/blocks.19/self_attn/Gather_12_output_0/blocks.19/self_attn/Gather_12"Gather* axis y )/blocks.19/self_attn/Transpose_2_output_0&/blocks.19/self_attn/Shape_12_output_0/blocks.19/self_attn/Shape_12"Shape )/blocks.19/self_attn/Constant_46_output_0 /blocks.19/self_attn/Constant_46"Constant*F value*:B,/blocks.19/self_attn/Constant_46_attr::valueJ  &/blocks.19/self_attn/Shape_12_output_0 )/blocks.19/self_attn/Constant_46_output_0'/blocks.19/self_attn/Gather_13_output_0/blocks.19/self_attn/Gather_13"Gather* axis )/blocks.19/self_attn/Constant_47_output_0 /blocks.19/self_attn/Constant_47"Constant*H value*<B,/blocks.19/self_attn/Constant_47_attr::valueJ  )/blocks.19/self_attn/Transpose_2_output_0 )/blocks.19/self_attn/Constant_47_output_0*/blocks.19/self_attn/Unsqueeze_21_output_0!/blocks.19/self_attn/Unsqueeze_21" Unsqueeze )/blocks.19/self_attn/Constant_48_output_0 /blocks.19/self_attn/Constant_48"Constant*H value*<B,/blocks.19/self_attn/Constant_48_attr::valueJ  '/blocks.19/self_attn/Gather_10_output_0 )/blocks.19/self_attn/Constant_48_output_0*/blocks.19/self_attn/Unsqueeze_22_output_0!/blocks.19/self_attn/Unsqueeze_22" Unsqueeze )/blocks.19/self_attn/Constant_49_output_0 /blocks.19/self_attn/Constant_49"Constant*H value*<B,/blocks.19/self_attn/Constant_49_attr::valueJ  '/blocks.19/self_attn/Gather_11_output_0 )/blocks.19/self_attn/Constant_49_output_0*/blocks.19/self_attn/Unsqueeze_23_output_0!/blocks.19/self_attn/Unsqueeze_23" Unsqueeze )/blocks.19/self_attn/Constant_50_output_0 /blocks.19/self_attn/Constant_50"Constant*H value*<B,/blocks.19/self_attn/Constant_50_attr::valueJ )/blocks.19/self_attn/Constant_51_output_0 /blocks.19/self_attn/Constant_51"Constant*H value*<B,/blocks.19/self_attn/Constant_51_attr::valueJ  '/blocks.19/self_attn/Gather_12_output_0 )/blocks.19/self_attn/Constant_51_output_0*/blocks.19/self_attn/Unsqueeze_24_output_0!/blocks.19/self_attn/Unsqueeze_24" Unsqueeze )/blocks.19/self_attn/Constant_52_output_0 /blocks.19/self_attn/Constant_52"Constant*H value*<B,/blocks.19/self_attn/Constant_52_attr::valueJ  '/blocks.19/self_attn/Gather_13_output_0 )/blocks.19/self_attn/Constant_52_output_0*/blocks.19/self_attn/Unsqueeze_25_output_0!/blocks.19/self_attn/Unsqueeze_25" Unsqueeze  */blocks.19/self_attn/Unsqueeze_22_output_0 */blocks.19/self_attn/Unsqueeze_23_output_0 )/blocks.19/self_attn/Constant_50_output_0 */blocks.19/self_attn/Unsqueeze_24_output_0 */blocks.19/self_attn/Unsqueeze_25_output_0'/blocks.19/self_attn/Concat_10_output_0/blocks.19/self_attn/Concat_10"Concat* axis )/blocks.19/self_attn/Constant_53_output_0 /blocks.19/self_attn/Constant_53"Constant*H value*<B,/blocks.19/self_attn/Constant_53_attr::valueJ  '/blocks.19/self_attn/Concat_10_output_0 )/blocks.19/self_attn/Constant_53_output_0'/blocks.19/self_attn/Reshape_5_output_0/blocks.19/self_attn/Reshape_5"Reshape* allowzero w '/blocks.19/self_attn/Reshape_5_output_0&/blocks.19/self_attn/Shape_13_output_0/blocks.19/self_attn/Shape_13"Shape  &/blocks.19/self_attn/Shape_13_output_0//blocks.19/self_attn/ConstantOfShape_1_output_0&/blocks.19/self_attn/ConstantOfShape_1"ConstantOfShape*N value*BB2/blocks.19/self_attn/ConstantOfShape_1_attr::valueJ )/blocks.19/self_attn/Constant_54_output_0 /blocks.19/self_attn/Constant_54"Constant*F value*:B,/blocks.19/self_attn/Constant_54_attr::valueJ  //blocks.19/self_attn/ConstantOfShape_1_output_0 )/blocks.19/self_attn/Constant_54_output_0#/blocks.19/self_attn/Mul_6_output_0/blocks.19/self_attn/Mul_6"Mul  '/blocks.19/self_attn/Reshape_5_output_0 #/blocks.19/self_attn/Mul_6_output_0%/blocks.19/self_attn/Equal_1_output_0/blocks.19/self_attn/Equal_1"Equal  %/blocks.19/self_attn/Equal_1_output_0 //blocks.19/self_attn/ConstantOfShape_1_output_0 '/blocks.19/self_attn/Reshape_5_output_0%/blocks.19/self_attn/Where_1_output_0/blocks.19/self_attn/Where_1"Where  */blocks.19/self_attn/Unsqueeze_21_output_0 %/blocks.19/self_attn/Where_1_output_0&/blocks.19/self_attn/Expand_1_output_0/blocks.19/self_attn/Expand_1"Expand )/blocks.19/self_attn/Constant_55_output_0 /blocks.19/self_attn/Constant_55"Constant*F value*:B,/blocks.19/self_attn/Constant_55_attr::valueJ  '/blocks.19/self_attn/Gather_11_output_0 )/blocks.19/self_attn/Constant_55_output_0#/blocks.19/self_attn/Mul_7_output_0/blocks.19/self_attn/Mul_7"Mul fonnx::Unsqueeze_6106 Constant_7736"Constant*5 value*)BConstant_7736_attr::valueJ  '/blocks.19/self_attn/Gather_10_output_0 onnx::Unsqueeze_6106*/blocks.19/self_attn/Unsqueeze_26_output_0!/blocks.19/self_attn/Unsqueeze_26" Unsqueeze fonnx::Unsqueeze_6108 Constant_7738"Constant*5 value*)BConstant_7738_attr::valueJ  #/blocks.19/self_attn/Mul_7_output_0 onnx::Unsqueeze_6108*/blocks.19/self_attn/Unsqueeze_27_output_0!/blocks.19/self_attn/Unsqueeze_27" Unsqueeze fonnx::Unsqueeze_6110 Constant_7740"Constant*5 value*)BConstant_7740_attr::valueJ  '/blocks.19/self_attn/Gather_12_output_0 onnx::Unsqueeze_6110*/blocks.19/self_attn/Unsqueeze_28_output_0!/blocks.19/self_attn/Unsqueeze_28" Unsqueeze fonnx::Unsqueeze_6112 Constant_7742"Constant*5 value*)BConstant_7742_attr::valueJ  '/blocks.19/self_attn/Gather_13_output_0 onnx::Unsqueeze_6112*/blocks.19/self_attn/Unsqueeze_29_output_0!/blocks.19/self_attn/Unsqueeze_29" Unsqueeze  */blocks.19/self_attn/Unsqueeze_26_output_0 */blocks.19/self_attn/Unsqueeze_27_output_0 */blocks.19/self_attn/Unsqueeze_28_output_0 */blocks.19/self_attn/Unsqueeze_29_output_0'/blocks.19/self_attn/Concat_11_output_0/blocks.19/self_attn/Concat_11"Concat* axis  &/blocks.19/self_attn/Expand_1_output_0 '/blocks.19/self_attn/Concat_11_output_0'/blocks.19/self_attn/Reshape_6_output_0/blocks.19/self_attn/Reshape_6"Reshape* allowzero  '/blocks.19/self_attn/Transpose_output_0 '/blocks.19/self_attn/Reshape_4_output_0$/blocks.19/self_attn/MatMul_output_0/blocks.19/self_attn/MatMul"MatMul )/blocks.19/self_attn/Constant_56_output_0 /blocks.19/self_attn/Constant_56"Constant*B value*6B,/blocks.19/self_attn/Constant_56_attr::valueJ5A  $/blocks.19/self_attn/MatMul_output_0 )/blocks.19/self_attn/Constant_56_output_0#/blocks.19/self_attn/Div_2_output_0/blocks.19/self_attn/Div_2"Div { #/blocks.19/self_attn/Div_2_output_0 attention_mask#/blocks.19/self_attn/Add_2_output_0/blocks.19/self_attn/Add_2"Add  #/blocks.19/self_attn/Add_2_output_0%/blocks.19/self_attn/Softmax_output_0/blocks.19/self_attn/Softmax"Softmax* axis { %/blocks.19/self_attn/Softmax_output_0$/blocks.19/self_attn/Cast_4_output_0/blocks.19/self_attn/Cast_4"Cast* to  $/blocks.19/self_attn/Cast_4_output_0 '/blocks.19/self_attn/Reshape_6_output_0&/blocks.19/self_attn/MatMul_1_output_0/blocks.19/self_attn/MatMul_1"MatMul  &/blocks.19/self_attn/MatMul_1_output_0)/blocks.19/self_attn/Transpose_3_output_0 /blocks.19/self_attn/Transpose_3" Transpose* perm@@@@ fonnx::Unsqueeze_6124 Constant_7754"Constant*5 value*)BConstant_7754_attr::valueJ  $/blocks.19/self_attn/Gather_output_0 onnx::Unsqueeze_6124*/blocks.19/self_attn/Unsqueeze_30_output_0!/blocks.19/self_attn/Unsqueeze_30" Unsqueeze fonnx::Unsqueeze_6126 Constant_7756"Constant*5 value*)BConstant_7756_attr::valueJ  &/blocks.19/self_attn/Gather_1_output_0 onnx::Unsqueeze_6126*/blocks.19/self_attn/Unsqueeze_31_output_0!/blocks.19/self_attn/Unsqueeze_31" Unsqueeze )/blocks.19/self_attn/Constant_57_output_0 /blocks.19/self_attn/Constant_57"Constant*H value*<B,/blocks.19/self_attn/Constant_57_attr::valueJ  */blocks.19/self_attn/Unsqueeze_30_output_0 */blocks.19/self_attn/Unsqueeze_31_output_0 )/blocks.19/self_attn/Constant_57_output_0'/blocks.19/self_attn/Concat_12_output_0/blocks.19/self_attn/Concat_12"Concat* axis  )/blocks.19/self_attn/Transpose_3_output_0 '/blocks.19/self_attn/Concat_12_output_0'/blocks.19/self_attn/Reshape_7_output_0/blocks.19/self_attn/Reshape_7"Reshape* allowzero  '/blocks.19/self_attn/Reshape_7_output_0 onnx::MatMul_9121+/blocks.19/self_attn/o_proj/MatMul_output_0"/blocks.19/self_attn/o_proj/MatMul"MatMul  */blocks.19/input_layernorm/Cast_1_output_0 +/blocks.19/self_attn/o_proj/MatMul_output_0/blocks.19/Add_output_0/blocks.19/Add"Add  /blocks.19/Add_output_01/blocks.19/post_attention_layernorm/Cast_output_0(/blocks.19/post_attention_layernorm/Cast"Cast* to 5/blocks.19/post_attention_layernorm/Constant_output_0,/blocks.19/post_attention_layernorm/Constant"Constant*N value*BB8/blocks.19/post_attention_layernorm/Constant_attr::valueJ@  1/blocks.19/post_attention_layernorm/Cast_output_0 5/blocks.19/post_attention_layernorm/Constant_output_00/blocks.19/post_attention_layernorm/Pow_output_0'/blocks.19/post_attention_layernorm/Pow"Pow  0/blocks.19/post_attention_layernorm/Pow_output_07/blocks.19/post_attention_layernorm/ReduceMean_output_0./blocks.19/post_attention_layernorm/ReduceMean" ReduceMean* axes@* keepdims 7/blocks.19/post_attention_layernorm/Constant_1_output_0./blocks.19/post_attention_layernorm/Constant_1"Constant*P value*DB:/blocks.19/post_attention_layernorm/Constant_1_attr::valueJ75  7/blocks.19/post_attention_layernorm/ReduceMean_output_0 7/blocks.19/post_attention_layernorm/Constant_1_output_00/blocks.19/post_attention_layernorm/Add_output_0'/blocks.19/post_attention_layernorm/Add"Add  0/blocks.19/post_attention_layernorm/Add_output_01/blocks.19/post_attention_layernorm/Sqrt_output_0(/blocks.19/post_attention_layernorm/Sqrt"Sqrt 7/blocks.19/post_attention_layernorm/Constant_2_output_0./blocks.19/post_attention_layernorm/Constant_2"Constant*P value*DB:/blocks.19/post_attention_layernorm/Constant_2_attr::valueJ?  7/blocks.19/post_attention_layernorm/Constant_2_output_0 1/blocks.19/post_attention_layernorm/Sqrt_output_00/blocks.19/post_attention_layernorm/Div_output_0'/blocks.19/post_attention_layernorm/Div"Div  1/blocks.19/post_attention_layernorm/Cast_output_03/blocks.19/post_attention_layernorm/Cast_1_output_0*/blocks.19/post_attention_layernorm/Cast_1"Cast* to  3/blocks.19/post_attention_layernorm/Cast_1_output_0 0/blocks.19/post_attention_layernorm/Div_output_00/blocks.19/post_attention_layernorm/Mul_output_0'/blocks.19/post_attention_layernorm/Mul"Mul  0/blocks.19/post_attention_layernorm/Mul_output_0 )blocks.19.post_attention_layernorm.weight2/blocks.19/post_attention_layernorm/Mul_1_output_0)/blocks.19/post_attention_layernorm/Mul_1"Mul  2/blocks.19/post_attention_layernorm/Mul_1_output_03/blocks.19/post_attention_layernorm/Cast_2_output_0*/blocks.19/post_attention_layernorm/Cast_2"Cast* to  3/blocks.19/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_9122(/blocks.19/mlp/gate_proj/MatMul_output_0/blocks.19/mlp/gate_proj/MatMul"MatMul z (/blocks.19/mlp/gate_proj/MatMul_output_0&/blocks.19/mlp/act_fn/Sigmoid_output_0/blocks.19/mlp/act_fn/Sigmoid"Sigmoid  (/blocks.19/mlp/gate_proj/MatMul_output_0 &/blocks.19/mlp/act_fn/Sigmoid_output_0"/blocks.19/mlp/act_fn/Mul_output_0/blocks.19/mlp/act_fn/Mul"Mul  3/blocks.19/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_9123&/blocks.19/mlp/up_proj/MatMul_output_0/blocks.19/mlp/up_proj/MatMul"MatMul  "/blocks.19/mlp/act_fn/Mul_output_0 &/blocks.19/mlp/up_proj/MatMul_output_0/blocks.19/mlp/Mul_output_0/blocks.19/mlp/Mul"Mul  /blocks.19/mlp/Mul_output_0 onnx::MatMul_9124(/blocks.19/mlp/down_proj/MatMul_output_0/blocks.19/mlp/down_proj/MatMul"MatMul  3/blocks.19/post_attention_layernorm/Cast_1_output_0 (/blocks.19/mlp/down_proj/MatMul_output_0/blocks.19/Add_1_output_0/blocks.19/Add_1"Add c/Constant_12_output_0 /Constant_12"Constant*2 value*&B/Constant_12_attr::valueJ ^ past_key_values /Constant_12_output_0/Gather_20_output_0 /Gather_20"Gather* axis /blocks.20/Constant_output_0/blocks.20/Constant"Constant*K value*?B/blocks.20/Constant_attr::valueJ  /blocks.19/Add_1_output_0 /blocks.20/Constant_output_0/blocks.20/Reshape_output_0/blocks.20/Reshape"Reshape* allowzero y /blocks.20/Reshape_output_0(/blocks.20/input_layernorm/Cast_output_0/blocks.20/input_layernorm/Cast"Cast* to ,/blocks.20/input_layernorm/Constant_output_0#/blocks.20/input_layernorm/Constant"Constant*E value*9B//blocks.20/input_layernorm/Constant_attr::valueJ@  (/blocks.20/input_layernorm/Cast_output_0 ,/blocks.20/input_layernorm/Constant_output_0'/blocks.20/input_layernorm/Pow_output_0/blocks.20/input_layernorm/Pow"Pow  '/blocks.20/input_layernorm/Pow_output_0./blocks.20/input_layernorm/ReduceMean_output_0%/blocks.20/input_layernorm/ReduceMean" ReduceMean* axes@* keepdims ./blocks.20/input_layernorm/Constant_1_output_0%/blocks.20/input_layernorm/Constant_1"Constant*G value*;B1/blocks.20/input_layernorm/Constant_1_attr::valueJ75  ./blocks.20/input_layernorm/ReduceMean_output_0 ./blocks.20/input_layernorm/Constant_1_output_0'/blocks.20/input_layernorm/Add_output_0/blocks.20/input_layernorm/Add"Add z '/blocks.20/input_layernorm/Add_output_0(/blocks.20/input_layernorm/Sqrt_output_0/blocks.20/input_layernorm/Sqrt"Sqrt ./blocks.20/input_layernorm/Constant_2_output_0%/blocks.20/input_layernorm/Constant_2"Constant*G value*;B1/blocks.20/input_layernorm/Constant_2_attr::valueJ?  ./blocks.20/input_layernorm/Constant_2_output_0 (/blocks.20/input_layernorm/Sqrt_output_0'/blocks.20/input_layernorm/Div_output_0/blocks.20/input_layernorm/Div"Div  (/blocks.20/input_layernorm/Cast_output_0*/blocks.20/input_layernorm/Cast_1_output_0!/blocks.20/input_layernorm/Cast_1"Cast* to  */blocks.20/input_layernorm/Cast_1_output_0 '/blocks.20/input_layernorm/Div_output_0'/blocks.20/input_layernorm/Mul_output_0/blocks.20/input_layernorm/Mul"Mul  '/blocks.20/input_layernorm/Mul_output_0 blocks.20.input_layernorm.weight)/blocks.20/input_layernorm/Mul_1_output_0 /blocks.20/input_layernorm/Mul_1"Mul  )/blocks.20/input_layernorm/Mul_1_output_0*/blocks.20/input_layernorm/Cast_2_output_0!/blocks.20/input_layernorm/Cast_2"Cast* to t */blocks.20/input_layernorm/Cast_2_output_0#/blocks.20/self_attn/Shape_output_0/blocks.20/self_attn/Shape"Shape &/blocks.20/self_attn/Constant_output_0/blocks.20/self_attn/Constant"Constant*C value*7B)/blocks.20/self_attn/Constant_attr::valueJ  #/blocks.20/self_attn/Shape_output_0 &/blocks.20/self_attn/Constant_output_0$/blocks.20/self_attn/Gather_output_0/blocks.20/self_attn/Gather"Gather* axis x */blocks.20/input_layernorm/Cast_2_output_0%/blocks.20/self_attn/Shape_1_output_0/blocks.20/self_attn/Shape_1"Shape (/blocks.20/self_attn/Constant_1_output_0/blocks.20/self_attn/Constant_1"Constant*E value*9B+/blocks.20/self_attn/Constant_1_attr::valueJ  %/blocks.20/self_attn/Shape_1_output_0 (/blocks.20/self_attn/Constant_1_output_0&/blocks.20/self_attn/Gather_1_output_0/blocks.20/self_attn/Gather_1"Gather* axis  */blocks.20/input_layernorm/Cast_2_output_0 onnx::MatMul_9125+/blocks.20/self_attn/q_proj/MatMul_output_0"/blocks.20/self_attn/q_proj/MatMul"MatMul  */blocks.20/input_layernorm/Cast_2_output_0 onnx::MatMul_9126+/blocks.20/self_attn/k_proj/MatMul_output_0"/blocks.20/self_attn/k_proj/MatMul"MatMul  */blocks.20/input_layernorm/Cast_2_output_0 onnx::MatMul_9127+/blocks.20/self_attn/v_proj/MatMul_output_0"/blocks.20/self_attn/v_proj/MatMul"MatMul fonnx::Unsqueeze_6187 Constant_7809"Constant*5 value*)BConstant_7809_attr::valueJ  $/blocks.20/self_attn/Gather_output_0 onnx::Unsqueeze_6187'/blocks.20/self_attn/Unsqueeze_output_0/blocks.20/self_attn/Unsqueeze" Unsqueeze fonnx::Unsqueeze_6189 Constant_7811"Constant*5 value*)BConstant_7811_attr::valueJ  &/blocks.20/self_attn/Gather_1_output_0 onnx::Unsqueeze_6189)/blocks.20/self_attn/Unsqueeze_1_output_0 /blocks.20/self_attn/Unsqueeze_1" Unsqueeze (/blocks.20/self_attn/Constant_2_output_0/blocks.20/self_attn/Constant_2"Constant*G value*;B+/blocks.20/self_attn/Constant_2_attr::valueJ (/blocks.20/self_attn/Constant_3_output_0/blocks.20/self_attn/Constant_3"Constant*G value*;B+/blocks.20/self_attn/Constant_3_attr::valueJ  '/blocks.20/self_attn/Unsqueeze_output_0 )/blocks.20/self_attn/Unsqueeze_1_output_0 (/blocks.20/self_attn/Constant_2_output_0 (/blocks.20/self_attn/Constant_3_output_0$/blocks.20/self_attn/Concat_output_0/blocks.20/self_attn/Concat"Concat* axis  +/blocks.20/self_attn/q_proj/MatMul_output_0 $/blocks.20/self_attn/Concat_output_0%/blocks.20/self_attn/Reshape_output_0/blocks.20/self_attn/Reshape"Reshape* allowzero fonnx::Unsqueeze_6197 Constant_7817"Constant*5 value*)BConstant_7817_attr::valueJ  $/blocks.20/self_attn/Gather_output_0 onnx::Unsqueeze_6197)/blocks.20/self_attn/Unsqueeze_2_output_0 /blocks.20/self_attn/Unsqueeze_2" Unsqueeze fonnx::Unsqueeze_6199 Constant_7819"Constant*5 value*)BConstant_7819_attr::valueJ  &/blocks.20/self_attn/Gather_1_output_0 onnx::Unsqueeze_6199)/blocks.20/self_attn/Unsqueeze_3_output_0 /blocks.20/self_attn/Unsqueeze_3" Unsqueeze (/blocks.20/self_attn/Constant_4_output_0/blocks.20/self_attn/Constant_4"Constant*G value*;B+/blocks.20/self_attn/Constant_4_attr::valueJ (/blocks.20/self_attn/Constant_5_output_0/blocks.20/self_attn/Constant_5"Constant*G value*;B+/blocks.20/self_attn/Constant_5_attr::valueJ  )/blocks.20/self_attn/Unsqueeze_2_output_0 )/blocks.20/self_attn/Unsqueeze_3_output_0 (/blocks.20/self_attn/Constant_4_output_0 (/blocks.20/self_attn/Constant_5_output_0&/blocks.20/self_attn/Concat_1_output_0/blocks.20/self_attn/Concat_1"Concat* axis fonnx::Unsqueeze_6206 Constant_7824"Constant*5 value*)BConstant_7824_attr::valueJ  $/blocks.20/self_attn/Gather_output_0 onnx::Unsqueeze_6206)/blocks.20/self_attn/Unsqueeze_4_output_0 /blocks.20/self_attn/Unsqueeze_4" Unsqueeze fonnx::Unsqueeze_6208 Constant_7826"Constant*5 value*)BConstant_7826_attr::valueJ  &/blocks.20/self_attn/Gather_1_output_0 onnx::Unsqueeze_6208)/blocks.20/self_attn/Unsqueeze_5_output_0 /blocks.20/self_attn/Unsqueeze_5" Unsqueeze (/blocks.20/self_attn/Constant_6_output_0/blocks.20/self_attn/Constant_6"Constant*G value*;B+/blocks.20/self_attn/Constant_6_attr::valueJ (/blocks.20/self_attn/Constant_7_output_0/blocks.20/self_attn/Constant_7"Constant*G value*;B+/blocks.20/self_attn/Constant_7_attr::valueJ  )/blocks.20/self_attn/Unsqueeze_4_output_0 )/blocks.20/self_attn/Unsqueeze_5_output_0 (/blocks.20/self_attn/Constant_6_output_0 (/blocks.20/self_attn/Constant_7_output_0&/blocks.20/self_attn/Concat_2_output_0/blocks.20/self_attn/Concat_2"Concat* axis  +/blocks.20/self_attn/k_proj/MatMul_output_0 &/blocks.20/self_attn/Concat_1_output_0'/blocks.20/self_attn/Reshape_1_output_0/blocks.20/self_attn/Reshape_1"Reshape* allowzero  +/blocks.20/self_attn/v_proj/MatMul_output_0 &/blocks.20/self_attn/Concat_2_output_0'/blocks.20/self_attn/Reshape_2_output_0/blocks.20/self_attn/Reshape_2"Reshape* allowzero  %/blocks.20/self_attn/Reshape_output_0)/blocks.20/self_attn/q_norm/Cast_output_0 /blocks.20/self_attn/q_norm/Cast"Cast* to -/blocks.20/self_attn/q_norm/Constant_output_0$/blocks.20/self_attn/q_norm/Constant"Constant*F value*:B0/blocks.20/self_attn/q_norm/Constant_attr::valueJ@  )/blocks.20/self_attn/q_norm/Cast_output_0 -/blocks.20/self_attn/q_norm/Constant_output_0(/blocks.20/self_attn/q_norm/Pow_output_0/blocks.20/self_attn/q_norm/Pow"Pow  (/blocks.20/self_attn/q_norm/Pow_output_0//blocks.20/self_attn/q_norm/ReduceMean_output_0&/blocks.20/self_attn/q_norm/ReduceMean" ReduceMean* axes@* keepdims //blocks.20/self_attn/q_norm/Constant_1_output_0&/blocks.20/self_attn/q_norm/Constant_1"Constant*H value*<B2/blocks.20/self_attn/q_norm/Constant_1_attr::valueJ75  //blocks.20/self_attn/q_norm/ReduceMean_output_0 //blocks.20/self_attn/q_norm/Constant_1_output_0(/blocks.20/self_attn/q_norm/Add_output_0/blocks.20/self_attn/q_norm/Add"Add } (/blocks.20/self_attn/q_norm/Add_output_0)/blocks.20/self_attn/q_norm/Sqrt_output_0 /blocks.20/self_attn/q_norm/Sqrt"Sqrt //blocks.20/self_attn/q_norm/Constant_2_output_0&/blocks.20/self_attn/q_norm/Constant_2"Constant*H value*<B2/blocks.20/self_attn/q_norm/Constant_2_attr::valueJ?  //blocks.20/self_attn/q_norm/Constant_2_output_0 )/blocks.20/self_attn/q_norm/Sqrt_output_0(/blocks.20/self_attn/q_norm/Div_output_0/blocks.20/self_attn/q_norm/Div"Div  )/blocks.20/self_attn/q_norm/Cast_output_0+/blocks.20/self_attn/q_norm/Cast_1_output_0"/blocks.20/self_attn/q_norm/Cast_1"Cast* to  +/blocks.20/self_attn/q_norm/Cast_1_output_0 (/blocks.20/self_attn/q_norm/Div_output_0(/blocks.20/self_attn/q_norm/Mul_output_0/blocks.20/self_attn/q_norm/Mul"Mul  (/blocks.20/self_attn/q_norm/Mul_output_0 !blocks.20.self_attn.q_norm.weight*/blocks.20/self_attn/q_norm/Mul_1_output_0!/blocks.20/self_attn/q_norm/Mul_1"Mul  */blocks.20/self_attn/q_norm/Mul_1_output_0+/blocks.20/self_attn/q_norm/Cast_2_output_0"/blocks.20/self_attn/q_norm/Cast_2"Cast* to  '/blocks.20/self_attn/Reshape_1_output_0)/blocks.20/self_attn/k_norm/Cast_output_0 /blocks.20/self_attn/k_norm/Cast"Cast* to -/blocks.20/self_attn/k_norm/Constant_output_0$/blocks.20/self_attn/k_norm/Constant"Constant*F value*:B0/blocks.20/self_attn/k_norm/Constant_attr::valueJ@  )/blocks.20/self_attn/k_norm/Cast_output_0 -/blocks.20/self_attn/k_norm/Constant_output_0(/blocks.20/self_attn/k_norm/Pow_output_0/blocks.20/self_attn/k_norm/Pow"Pow  (/blocks.20/self_attn/k_norm/Pow_output_0//blocks.20/self_attn/k_norm/ReduceMean_output_0&/blocks.20/self_attn/k_norm/ReduceMean" ReduceMean* axes@* keepdims //blocks.20/self_attn/k_norm/Constant_1_output_0&/blocks.20/self_attn/k_norm/Constant_1"Constant*H value*<B2/blocks.20/self_attn/k_norm/Constant_1_attr::valueJ75  //blocks.20/self_attn/k_norm/ReduceMean_output_0 //blocks.20/self_attn/k_norm/Constant_1_output_0(/blocks.20/self_attn/k_norm/Add_output_0/blocks.20/self_attn/k_norm/Add"Add } (/blocks.20/self_attn/k_norm/Add_output_0)/blocks.20/self_attn/k_norm/Sqrt_output_0 /blocks.20/self_attn/k_norm/Sqrt"Sqrt //blocks.20/self_attn/k_norm/Constant_2_output_0&/blocks.20/self_attn/k_norm/Constant_2"Constant*H value*<B2/blocks.20/self_attn/k_norm/Constant_2_attr::valueJ?  //blocks.20/self_attn/k_norm/Constant_2_output_0 )/blocks.20/self_attn/k_norm/Sqrt_output_0(/blocks.20/self_attn/k_norm/Div_output_0/blocks.20/self_attn/k_norm/Div"Div  )/blocks.20/self_attn/k_norm/Cast_output_0+/blocks.20/self_attn/k_norm/Cast_1_output_0"/blocks.20/self_attn/k_norm/Cast_1"Cast* to  +/blocks.20/self_attn/k_norm/Cast_1_output_0 (/blocks.20/self_attn/k_norm/Div_output_0(/blocks.20/self_attn/k_norm/Mul_output_0/blocks.20/self_attn/k_norm/Mul"Mul  (/blocks.20/self_attn/k_norm/Mul_output_0 !blocks.20.self_attn.k_norm.weight*/blocks.20/self_attn/k_norm/Mul_1_output_0!/blocks.20/self_attn/k_norm/Mul_1"Mul  */blocks.20/self_attn/k_norm/Mul_1_output_0+/blocks.20/self_attn/k_norm/Cast_2_output_0"/blocks.20/self_attn/k_norm/Cast_2"Cast* to  +/blocks.20/self_attn/q_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0!/blocks.20/self_attn/Mul_output_0/blocks.20/self_attn/Mul"Mul y +/blocks.20/self_attn/q_norm/Cast_2_output_0%/blocks.20/self_attn/Shape_2_output_0/blocks.20/self_attn/Shape_2"Shape (/blocks.20/self_attn/Constant_8_output_0/blocks.20/self_attn/Constant_8"Constant*E value*9B+/blocks.20/self_attn/Constant_8_attr::valueJ  %/blocks.20/self_attn/Shape_2_output_0 (/blocks.20/self_attn/Constant_8_output_0&/blocks.20/self_attn/Gather_2_output_0/blocks.20/self_attn/Gather_2"Gather* axis (/blocks.20/self_attn/Constant_9_output_0/blocks.20/self_attn/Constant_9"Constant*E value*9B+/blocks.20/self_attn/Constant_9_attr::valueJ  &/blocks.20/self_attn/Gather_2_output_0 (/blocks.20/self_attn/Constant_9_output_0!/blocks.20/self_attn/Div_output_0/blocks.20/self_attn/Div"Div s !/blocks.20/self_attn/Div_output_0"/blocks.20/self_attn/Cast_output_0/blocks.20/self_attn/Cast"Cast* to x "/blocks.20/self_attn/Cast_output_0$/blocks.20/self_attn/Cast_1_output_0/blocks.20/self_attn/Cast_1"Cast* to )/blocks.20/self_attn/Constant_10_output_0 /blocks.20/self_attn/Constant_10"Constant*H value*<B,/blocks.20/self_attn/Constant_10_attr::valueJ )/blocks.20/self_attn/Constant_11_output_0 /blocks.20/self_attn/Constant_11"Constant*H value*<B,/blocks.20/self_attn/Constant_11_attr::valueJ )/blocks.20/self_attn/Constant_12_output_0 /blocks.20/self_attn/Constant_12"Constant*H value*<B,/blocks.20/self_attn/Constant_12_attr::valueJ  $/blocks.20/self_attn/Cast_1_output_0 )/blocks.20/self_attn/Constant_12_output_0)/blocks.20/self_attn/Unsqueeze_6_output_0 /blocks.20/self_attn/Unsqueeze_6" Unsqueeze )/blocks.20/self_attn/Constant_13_output_0 /blocks.20/self_attn/Constant_13"Constant*H value*<B,/blocks.20/self_attn/Constant_13_attr::valueJ  +/blocks.20/self_attn/q_norm/Cast_2_output_0 )/blocks.20/self_attn/Constant_11_output_0 )/blocks.20/self_attn/Unsqueeze_6_output_0 )/blocks.20/self_attn/Constant_10_output_0 )/blocks.20/self_attn/Constant_13_output_0#/blocks.20/self_attn/Slice_output_0/blocks.20/self_attn/Slice"Slice )/blocks.20/self_attn/Constant_14_output_0 /blocks.20/self_attn/Constant_14"Constant*H value*<B,/blocks.20/self_attn/Constant_14_attr::valueJ )/blocks.20/self_attn/Constant_15_output_0 /blocks.20/self_attn/Constant_15"Constant*H value*<B,/blocks.20/self_attn/Constant_15_attr::valueJ  $/blocks.20/self_attn/Cast_1_output_0 )/blocks.20/self_attn/Constant_15_output_0)/blocks.20/self_attn/Unsqueeze_7_output_0 /blocks.20/self_attn/Unsqueeze_7" Unsqueeze )/blocks.20/self_attn/Constant_16_output_0 /blocks.20/self_attn/Constant_16"Constant*H value*<B,/blocks.20/self_attn/Constant_16_attr::valueJ )/blocks.20/self_attn/Constant_17_output_0 /blocks.20/self_attn/Constant_17"Constant*H value*<B,/blocks.20/self_attn/Constant_17_attr::valueJ  +/blocks.20/self_attn/q_norm/Cast_2_output_0 )/blocks.20/self_attn/Unsqueeze_7_output_0 )/blocks.20/self_attn/Constant_16_output_0 )/blocks.20/self_attn/Constant_14_output_0 )/blocks.20/self_attn/Constant_17_output_0%/blocks.20/self_attn/Slice_1_output_0/blocks.20/self_attn/Slice_1"Slice i %/blocks.20/self_attn/Slice_1_output_0!/blocks.20/self_attn/Neg_output_0/blocks.20/self_attn/Neg"Neg  !/blocks.20/self_attn/Neg_output_0 #/blocks.20/self_attn/Slice_output_0&/blocks.20/self_attn/Concat_3_output_0/blocks.20/self_attn/Concat_3"Concat* axis  &/blocks.20/self_attn/Concat_3_output_0 %/blocks.0/self_attn/Gather_3_output_0#/blocks.20/self_attn/Mul_1_output_0/blocks.20/self_attn/Mul_1"Mul  !/blocks.20/self_attn/Mul_output_0 #/blocks.20/self_attn/Mul_1_output_0!/blocks.20/self_attn/Add_output_0/blocks.20/self_attn/Add"Add  +/blocks.20/self_attn/k_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0#/blocks.20/self_attn/Mul_2_output_0/blocks.20/self_attn/Mul_2"Mul y +/blocks.20/self_attn/k_norm/Cast_2_output_0%/blocks.20/self_attn/Shape_3_output_0/blocks.20/self_attn/Shape_3"Shape )/blocks.20/self_attn/Constant_18_output_0 /blocks.20/self_attn/Constant_18"Constant*F value*:B,/blocks.20/self_attn/Constant_18_attr::valueJ  %/blocks.20/self_attn/Shape_3_output_0 )/blocks.20/self_attn/Constant_18_output_0&/blocks.20/self_attn/Gather_3_output_0/blocks.20/self_attn/Gather_3"Gather* axis )/blocks.20/self_attn/Constant_19_output_0 /blocks.20/self_attn/Constant_19"Constant*F value*:B,/blocks.20/self_attn/Constant_19_attr::valueJ  &/blocks.20/self_attn/Gather_3_output_0 )/blocks.20/self_attn/Constant_19_output_0#/blocks.20/self_attn/Div_1_output_0/blocks.20/self_attn/Div_1"Div y #/blocks.20/self_attn/Div_1_output_0$/blocks.20/self_attn/Cast_2_output_0/blocks.20/self_attn/Cast_2"Cast* to z $/blocks.20/self_attn/Cast_2_output_0$/blocks.20/self_attn/Cast_3_output_0/blocks.20/self_attn/Cast_3"Cast* to )/blocks.20/self_attn/Constant_20_output_0 /blocks.20/self_attn/Constant_20"Constant*H value*<B,/blocks.20/self_attn/Constant_20_attr::valueJ )/blocks.20/self_attn/Constant_21_output_0 /blocks.20/self_attn/Constant_21"Constant*H value*<B,/blocks.20/self_attn/Constant_21_attr::valueJ )/blocks.20/self_attn/Constant_22_output_0 /blocks.20/self_attn/Constant_22"Constant*H value*<B,/blocks.20/self_attn/Constant_22_attr::valueJ  $/blocks.20/self_attn/Cast_3_output_0 )/blocks.20/self_attn/Constant_22_output_0)/blocks.20/self_attn/Unsqueeze_8_output_0 /blocks.20/self_attn/Unsqueeze_8" Unsqueeze )/blocks.20/self_attn/Constant_23_output_0 /blocks.20/self_attn/Constant_23"Constant*H value*<B,/blocks.20/self_attn/Constant_23_attr::valueJ  +/blocks.20/self_attn/k_norm/Cast_2_output_0 )/blocks.20/self_attn/Constant_21_output_0 )/blocks.20/self_attn/Unsqueeze_8_output_0 )/blocks.20/self_attn/Constant_20_output_0 )/blocks.20/self_attn/Constant_23_output_0%/blocks.20/self_attn/Slice_2_output_0/blocks.20/self_attn/Slice_2"Slice )/blocks.20/self_attn/Constant_24_output_0 /blocks.20/self_attn/Constant_24"Constant*H value*<B,/blocks.20/self_attn/Constant_24_attr::valueJ )/blocks.20/self_attn/Constant_25_output_0 /blocks.20/self_attn/Constant_25"Constant*H value*<B,/blocks.20/self_attn/Constant_25_attr::valueJ  $/blocks.20/self_attn/Cast_3_output_0 )/blocks.20/self_attn/Constant_25_output_0)/blocks.20/self_attn/Unsqueeze_9_output_0 /blocks.20/self_attn/Unsqueeze_9" Unsqueeze )/blocks.20/self_attn/Constant_26_output_0 /blocks.20/self_attn/Constant_26"Constant*H value*<B,/blocks.20/self_attn/Constant_26_attr::valueJ )/blocks.20/self_attn/Constant_27_output_0 /blocks.20/self_attn/Constant_27"Constant*H value*<B,/blocks.20/self_attn/Constant_27_attr::valueJ  +/blocks.20/self_attn/k_norm/Cast_2_output_0 )/blocks.20/self_attn/Unsqueeze_9_output_0 )/blocks.20/self_attn/Constant_26_output_0 )/blocks.20/self_attn/Constant_24_output_0 )/blocks.20/self_attn/Constant_27_output_0%/blocks.20/self_attn/Slice_3_output_0/blocks.20/self_attn/Slice_3"Slice m %/blocks.20/self_attn/Slice_3_output_0#/blocks.20/self_attn/Neg_1_output_0/blocks.20/self_attn/Neg_1"Neg  #/blocks.20/self_attn/Neg_1_output_0 %/blocks.20/self_attn/Slice_2_output_0&/blocks.20/self_attn/Concat_4_output_0/blocks.20/self_attn/Concat_4"Concat* axis  &/blocks.20/self_attn/Concat_4_output_0 %/blocks.0/self_attn/Gather_3_output_0#/blocks.20/self_attn/Mul_3_output_0/blocks.20/self_attn/Mul_3"Mul  #/blocks.20/self_attn/Mul_2_output_0 #/blocks.20/self_attn/Mul_3_output_0#/blocks.20/self_attn/Add_1_output_0/blocks.20/self_attn/Add_1"Add  /Gather_20_output_0 /rotary/Constant_3_output_0&/blocks.20/self_attn/Gather_4_output_0/blocks.20/self_attn/Gather_4"Gather* axis  /Gather_20_output_0 /rotary/Constant_8_output_0&/blocks.20/self_attn/Gather_5_output_0/blocks.20/self_attn/Gather_5"Gather* axis  &/blocks.20/self_attn/Gather_4_output_0 #/blocks.20/self_attn/Add_1_output_0&/blocks.20/self_attn/Concat_5_output_0/blocks.20/self_attn/Concat_5"Concat* axis  &/blocks.20/self_attn/Gather_5_output_0 '/blocks.20/self_attn/Reshape_2_output_0&/blocks.20/self_attn/Concat_6_output_0/blocks.20/self_attn/Concat_6"Concat* axis )/blocks.20/self_attn/Constant_28_output_0 /blocks.20/self_attn/Constant_28"Constant*H value*<B,/blocks.20/self_attn/Constant_28_attr::valueJ  &/blocks.20/self_attn/Concat_5_output_0 )/blocks.20/self_attn/Constant_28_output_0*/blocks.20/self_attn/Unsqueeze_10_output_0!/blocks.20/self_attn/Unsqueeze_10" Unsqueeze )/blocks.20/self_attn/Constant_29_output_0 /blocks.20/self_attn/Constant_29"Constant*H value*<B,/blocks.20/self_attn/Constant_29_attr::valueJ  &/blocks.20/self_attn/Concat_6_output_0 )/blocks.20/self_attn/Constant_29_output_0*/blocks.20/self_attn/Unsqueeze_11_output_0!/blocks.20/self_attn/Unsqueeze_11" Unsqueeze  */blocks.20/self_attn/Unsqueeze_10_output_0 */blocks.20/self_attn/Unsqueeze_11_output_0&/blocks.20/self_attn/Concat_7_output_0/blocks.20/self_attn/Concat_7"Concat* axis  !/blocks.20/self_attn/Add_output_0'/blocks.20/self_attn/Transpose_output_0/blocks.20/self_attn/Transpose" Transpose* perm@@@@  &/blocks.20/self_attn/Concat_5_output_0)/blocks.20/self_attn/Transpose_1_output_0 /blocks.20/self_attn/Transpose_1" Transpose* perm@@@@  &/blocks.20/self_attn/Concat_6_output_0)/blocks.20/self_attn/Transpose_2_output_0 /blocks.20/self_attn/Transpose_2" Transpose* perm@@@@ w )/blocks.20/self_attn/Transpose_1_output_0%/blocks.20/self_attn/Shape_4_output_0/blocks.20/self_attn/Shape_4"Shape )/blocks.20/self_attn/Constant_30_output_0 /blocks.20/self_attn/Constant_30"Constant*F value*:B,/blocks.20/self_attn/Constant_30_attr::valueJ  %/blocks.20/self_attn/Shape_4_output_0 )/blocks.20/self_attn/Constant_30_output_0&/blocks.20/self_attn/Gather_6_output_0/blocks.20/self_attn/Gather_6"Gather* axis w )/blocks.20/self_attn/Transpose_1_output_0%/blocks.20/self_attn/Shape_5_output_0/blocks.20/self_attn/Shape_5"Shape )/blocks.20/self_attn/Constant_31_output_0 /blocks.20/self_attn/Constant_31"Constant*F value*:B,/blocks.20/self_attn/Constant_31_attr::valueJ  %/blocks.20/self_attn/Shape_5_output_0 )/blocks.20/self_attn/Constant_31_output_0&/blocks.20/self_attn/Gather_7_output_0/blocks.20/self_attn/Gather_7"Gather* axis w )/blocks.20/self_attn/Transpose_1_output_0%/blocks.20/self_attn/Shape_6_output_0/blocks.20/self_attn/Shape_6"Shape )/blocks.20/self_attn/Constant_32_output_0 /blocks.20/self_attn/Constant_32"Constant*F value*:B,/blocks.20/self_attn/Constant_32_attr::valueJ  %/blocks.20/self_attn/Shape_6_output_0 )/blocks.20/self_attn/Constant_32_output_0&/blocks.20/self_attn/Gather_8_output_0/blocks.20/self_attn/Gather_8"Gather* axis w )/blocks.20/self_attn/Transpose_1_output_0%/blocks.20/self_attn/Shape_7_output_0/blocks.20/self_attn/Shape_7"Shape )/blocks.20/self_attn/Constant_33_output_0 /blocks.20/self_attn/Constant_33"Constant*F value*:B,/blocks.20/self_attn/Constant_33_attr::valueJ  %/blocks.20/self_attn/Shape_7_output_0 )/blocks.20/self_attn/Constant_33_output_0&/blocks.20/self_attn/Gather_9_output_0/blocks.20/self_attn/Gather_9"Gather* axis )/blocks.20/self_attn/Constant_34_output_0 /blocks.20/self_attn/Constant_34"Constant*H value*<B,/blocks.20/self_attn/Constant_34_attr::valueJ  )/blocks.20/self_attn/Transpose_1_output_0 )/blocks.20/self_attn/Constant_34_output_0*/blocks.20/self_attn/Unsqueeze_12_output_0!/blocks.20/self_attn/Unsqueeze_12" Unsqueeze )/blocks.20/self_attn/Constant_35_output_0 /blocks.20/self_attn/Constant_35"Constant*H value*<B,/blocks.20/self_attn/Constant_35_attr::valueJ  &/blocks.20/self_attn/Gather_6_output_0 )/blocks.20/self_attn/Constant_35_output_0*/blocks.20/self_attn/Unsqueeze_13_output_0!/blocks.20/self_attn/Unsqueeze_13" Unsqueeze )/blocks.20/self_attn/Constant_36_output_0 /blocks.20/self_attn/Constant_36"Constant*H value*<B,/blocks.20/self_attn/Constant_36_attr::valueJ  &/blocks.20/self_attn/Gather_7_output_0 )/blocks.20/self_attn/Constant_36_output_0*/blocks.20/self_attn/Unsqueeze_14_output_0!/blocks.20/self_attn/Unsqueeze_14" Unsqueeze )/blocks.20/self_attn/Constant_37_output_0 /blocks.20/self_attn/Constant_37"Constant*H value*<B,/blocks.20/self_attn/Constant_37_attr::valueJ )/blocks.20/self_attn/Constant_38_output_0 /blocks.20/self_attn/Constant_38"Constant*H value*<B,/blocks.20/self_attn/Constant_38_attr::valueJ  &/blocks.20/self_attn/Gather_8_output_0 )/blocks.20/self_attn/Constant_38_output_0*/blocks.20/self_attn/Unsqueeze_15_output_0!/blocks.20/self_attn/Unsqueeze_15" Unsqueeze )/blocks.20/self_attn/Constant_39_output_0 /blocks.20/self_attn/Constant_39"Constant*H value*<B,/blocks.20/self_attn/Constant_39_attr::valueJ  &/blocks.20/self_attn/Gather_9_output_0 )/blocks.20/self_attn/Constant_39_output_0*/blocks.20/self_attn/Unsqueeze_16_output_0!/blocks.20/self_attn/Unsqueeze_16" Unsqueeze  */blocks.20/self_attn/Unsqueeze_13_output_0 */blocks.20/self_attn/Unsqueeze_14_output_0 )/blocks.20/self_attn/Constant_37_output_0 */blocks.20/self_attn/Unsqueeze_15_output_0 */blocks.20/self_attn/Unsqueeze_16_output_0&/blocks.20/self_attn/Concat_8_output_0/blocks.20/self_attn/Concat_8"Concat* axis )/blocks.20/self_attn/Constant_40_output_0 /blocks.20/self_attn/Constant_40"Constant*H value*<B,/blocks.20/self_attn/Constant_40_attr::valueJ  &/blocks.20/self_attn/Concat_8_output_0 )/blocks.20/self_attn/Constant_40_output_0'/blocks.20/self_attn/Reshape_3_output_0/blocks.20/self_attn/Reshape_3"Reshape* allowzero u '/blocks.20/self_attn/Reshape_3_output_0%/blocks.20/self_attn/Shape_8_output_0/blocks.20/self_attn/Shape_8"Shape  %/blocks.20/self_attn/Shape_8_output_0-/blocks.20/self_attn/ConstantOfShape_output_0$/blocks.20/self_attn/ConstantOfShape"ConstantOfShape*L value*@B0/blocks.20/self_attn/ConstantOfShape_attr::valueJ )/blocks.20/self_attn/Constant_41_output_0 /blocks.20/self_attn/Constant_41"Constant*F value*:B,/blocks.20/self_attn/Constant_41_attr::valueJ  -/blocks.20/self_attn/ConstantOfShape_output_0 )/blocks.20/self_attn/Constant_41_output_0#/blocks.20/self_attn/Mul_4_output_0/blocks.20/self_attn/Mul_4"Mul  '/blocks.20/self_attn/Reshape_3_output_0 #/blocks.20/self_attn/Mul_4_output_0#/blocks.20/self_attn/Equal_output_0/blocks.20/self_attn/Equal"Equal  #/blocks.20/self_attn/Equal_output_0 -/blocks.20/self_attn/ConstantOfShape_output_0 '/blocks.20/self_attn/Reshape_3_output_0#/blocks.20/self_attn/Where_output_0/blocks.20/self_attn/Where"Where  */blocks.20/self_attn/Unsqueeze_12_output_0 #/blocks.20/self_attn/Where_output_0$/blocks.20/self_attn/Expand_output_0/blocks.20/self_attn/Expand"Expand )/blocks.20/self_attn/Constant_42_output_0 /blocks.20/self_attn/Constant_42"Constant*F value*:B,/blocks.20/self_attn/Constant_42_attr::valueJ  &/blocks.20/self_attn/Gather_7_output_0 )/blocks.20/self_attn/Constant_42_output_0#/blocks.20/self_attn/Mul_5_output_0/blocks.20/self_attn/Mul_5"Mul fonnx::Unsqueeze_6351 Constant_7954"Constant*5 value*)BConstant_7954_attr::valueJ  &/blocks.20/self_attn/Gather_6_output_0 onnx::Unsqueeze_6351*/blocks.20/self_attn/Unsqueeze_17_output_0!/blocks.20/self_attn/Unsqueeze_17" Unsqueeze fonnx::Unsqueeze_6353 Constant_7956"Constant*5 value*)BConstant_7956_attr::valueJ  #/blocks.20/self_attn/Mul_5_output_0 onnx::Unsqueeze_6353*/blocks.20/self_attn/Unsqueeze_18_output_0!/blocks.20/self_attn/Unsqueeze_18" Unsqueeze fonnx::Unsqueeze_6355 Constant_7958"Constant*5 value*)BConstant_7958_attr::valueJ  &/blocks.20/self_attn/Gather_8_output_0 onnx::Unsqueeze_6355*/blocks.20/self_attn/Unsqueeze_19_output_0!/blocks.20/self_attn/Unsqueeze_19" Unsqueeze fonnx::Unsqueeze_6357 Constant_7960"Constant*5 value*)BConstant_7960_attr::valueJ  &/blocks.20/self_attn/Gather_9_output_0 onnx::Unsqueeze_6357*/blocks.20/self_attn/Unsqueeze_20_output_0!/blocks.20/self_attn/Unsqueeze_20" Unsqueeze  */blocks.20/self_attn/Unsqueeze_17_output_0 */blocks.20/self_attn/Unsqueeze_18_output_0 */blocks.20/self_attn/Unsqueeze_19_output_0 */blocks.20/self_attn/Unsqueeze_20_output_0&/blocks.20/self_attn/Concat_9_output_0/blocks.20/self_attn/Concat_9"Concat* axis  $/blocks.20/self_attn/Expand_output_0 &/blocks.20/self_attn/Concat_9_output_0'/blocks.20/self_attn/Reshape_4_output_0/blocks.20/self_attn/Reshape_4"Reshape* allowzero w )/blocks.20/self_attn/Transpose_2_output_0%/blocks.20/self_attn/Shape_9_output_0/blocks.20/self_attn/Shape_9"Shape )/blocks.20/self_attn/Constant_43_output_0 /blocks.20/self_attn/Constant_43"Constant*F value*:B,/blocks.20/self_attn/Constant_43_attr::valueJ  %/blocks.20/self_attn/Shape_9_output_0 )/blocks.20/self_attn/Constant_43_output_0'/blocks.20/self_attn/Gather_10_output_0/blocks.20/self_attn/Gather_10"Gather* axis y )/blocks.20/self_attn/Transpose_2_output_0&/blocks.20/self_attn/Shape_10_output_0/blocks.20/self_attn/Shape_10"Shape )/blocks.20/self_attn/Constant_44_output_0 /blocks.20/self_attn/Constant_44"Constant*F value*:B,/blocks.20/self_attn/Constant_44_attr::valueJ  &/blocks.20/self_attn/Shape_10_output_0 )/blocks.20/self_attn/Constant_44_output_0'/blocks.20/self_attn/Gather_11_output_0/blocks.20/self_attn/Gather_11"Gather* axis y )/blocks.20/self_attn/Transpose_2_output_0&/blocks.20/self_attn/Shape_11_output_0/blocks.20/self_attn/Shape_11"Shape )/blocks.20/self_attn/Constant_45_output_0 /blocks.20/self_attn/Constant_45"Constant*F value*:B,/blocks.20/self_attn/Constant_45_attr::valueJ  &/blocks.20/self_attn/Shape_11_output_0 )/blocks.20/self_attn/Constant_45_output_0'/blocks.20/self_attn/Gather_12_output_0/blocks.20/self_attn/Gather_12"Gather* axis y )/blocks.20/self_attn/Transpose_2_output_0&/blocks.20/self_attn/Shape_12_output_0/blocks.20/self_attn/Shape_12"Shape )/blocks.20/self_attn/Constant_46_output_0 /blocks.20/self_attn/Constant_46"Constant*F value*:B,/blocks.20/self_attn/Constant_46_attr::valueJ  &/blocks.20/self_attn/Shape_12_output_0 )/blocks.20/self_attn/Constant_46_output_0'/blocks.20/self_attn/Gather_13_output_0/blocks.20/self_attn/Gather_13"Gather* axis )/blocks.20/self_attn/Constant_47_output_0 /blocks.20/self_attn/Constant_47"Constant*H value*<B,/blocks.20/self_attn/Constant_47_attr::valueJ  )/blocks.20/self_attn/Transpose_2_output_0 )/blocks.20/self_attn/Constant_47_output_0*/blocks.20/self_attn/Unsqueeze_21_output_0!/blocks.20/self_attn/Unsqueeze_21" Unsqueeze )/blocks.20/self_attn/Constant_48_output_0 /blocks.20/self_attn/Constant_48"Constant*H value*<B,/blocks.20/self_attn/Constant_48_attr::valueJ  '/blocks.20/self_attn/Gather_10_output_0 )/blocks.20/self_attn/Constant_48_output_0*/blocks.20/self_attn/Unsqueeze_22_output_0!/blocks.20/self_attn/Unsqueeze_22" Unsqueeze )/blocks.20/self_attn/Constant_49_output_0 /blocks.20/self_attn/Constant_49"Constant*H value*<B,/blocks.20/self_attn/Constant_49_attr::valueJ  '/blocks.20/self_attn/Gather_11_output_0 )/blocks.20/self_attn/Constant_49_output_0*/blocks.20/self_attn/Unsqueeze_23_output_0!/blocks.20/self_attn/Unsqueeze_23" Unsqueeze )/blocks.20/self_attn/Constant_50_output_0 /blocks.20/self_attn/Constant_50"Constant*H value*<B,/blocks.20/self_attn/Constant_50_attr::valueJ )/blocks.20/self_attn/Constant_51_output_0 /blocks.20/self_attn/Constant_51"Constant*H value*<B,/blocks.20/self_attn/Constant_51_attr::valueJ  '/blocks.20/self_attn/Gather_12_output_0 )/blocks.20/self_attn/Constant_51_output_0*/blocks.20/self_attn/Unsqueeze_24_output_0!/blocks.20/self_attn/Unsqueeze_24" Unsqueeze )/blocks.20/self_attn/Constant_52_output_0 /blocks.20/self_attn/Constant_52"Constant*H value*<B,/blocks.20/self_attn/Constant_52_attr::valueJ  '/blocks.20/self_attn/Gather_13_output_0 )/blocks.20/self_attn/Constant_52_output_0*/blocks.20/self_attn/Unsqueeze_25_output_0!/blocks.20/self_attn/Unsqueeze_25" Unsqueeze  */blocks.20/self_attn/Unsqueeze_22_output_0 */blocks.20/self_attn/Unsqueeze_23_output_0 )/blocks.20/self_attn/Constant_50_output_0 */blocks.20/self_attn/Unsqueeze_24_output_0 */blocks.20/self_attn/Unsqueeze_25_output_0'/blocks.20/self_attn/Concat_10_output_0/blocks.20/self_attn/Concat_10"Concat* axis )/blocks.20/self_attn/Constant_53_output_0 /blocks.20/self_attn/Constant_53"Constant*H value*<B,/blocks.20/self_attn/Constant_53_attr::valueJ  '/blocks.20/self_attn/Concat_10_output_0 )/blocks.20/self_attn/Constant_53_output_0'/blocks.20/self_attn/Reshape_5_output_0/blocks.20/self_attn/Reshape_5"Reshape* allowzero w '/blocks.20/self_attn/Reshape_5_output_0&/blocks.20/self_attn/Shape_13_output_0/blocks.20/self_attn/Shape_13"Shape  &/blocks.20/self_attn/Shape_13_output_0//blocks.20/self_attn/ConstantOfShape_1_output_0&/blocks.20/self_attn/ConstantOfShape_1"ConstantOfShape*N value*BB2/blocks.20/self_attn/ConstantOfShape_1_attr::valueJ )/blocks.20/self_attn/Constant_54_output_0 /blocks.20/self_attn/Constant_54"Constant*F value*:B,/blocks.20/self_attn/Constant_54_attr::valueJ  //blocks.20/self_attn/ConstantOfShape_1_output_0 )/blocks.20/self_attn/Constant_54_output_0#/blocks.20/self_attn/Mul_6_output_0/blocks.20/self_attn/Mul_6"Mul  '/blocks.20/self_attn/Reshape_5_output_0 #/blocks.20/self_attn/Mul_6_output_0%/blocks.20/self_attn/Equal_1_output_0/blocks.20/self_attn/Equal_1"Equal  %/blocks.20/self_attn/Equal_1_output_0 //blocks.20/self_attn/ConstantOfShape_1_output_0 '/blocks.20/self_attn/Reshape_5_output_0%/blocks.20/self_attn/Where_1_output_0/blocks.20/self_attn/Where_1"Where  */blocks.20/self_attn/Unsqueeze_21_output_0 %/blocks.20/self_attn/Where_1_output_0&/blocks.20/self_attn/Expand_1_output_0/blocks.20/self_attn/Expand_1"Expand )/blocks.20/self_attn/Constant_55_output_0 /blocks.20/self_attn/Constant_55"Constant*F value*:B,/blocks.20/self_attn/Constant_55_attr::valueJ  '/blocks.20/self_attn/Gather_11_output_0 )/blocks.20/self_attn/Constant_55_output_0#/blocks.20/self_attn/Mul_7_output_0/blocks.20/self_attn/Mul_7"Mul fonnx::Unsqueeze_6397 Constant_7999"Constant*5 value*)BConstant_7999_attr::valueJ  '/blocks.20/self_attn/Gather_10_output_0 onnx::Unsqueeze_6397*/blocks.20/self_attn/Unsqueeze_26_output_0!/blocks.20/self_attn/Unsqueeze_26" Unsqueeze fonnx::Unsqueeze_6399 Constant_8001"Constant*5 value*)BConstant_8001_attr::valueJ  #/blocks.20/self_attn/Mul_7_output_0 onnx::Unsqueeze_6399*/blocks.20/self_attn/Unsqueeze_27_output_0!/blocks.20/self_attn/Unsqueeze_27" Unsqueeze fonnx::Unsqueeze_6401 Constant_8003"Constant*5 value*)BConstant_8003_attr::valueJ  '/blocks.20/self_attn/Gather_12_output_0 onnx::Unsqueeze_6401*/blocks.20/self_attn/Unsqueeze_28_output_0!/blocks.20/self_attn/Unsqueeze_28" Unsqueeze fonnx::Unsqueeze_6403 Constant_8005"Constant*5 value*)BConstant_8005_attr::valueJ  '/blocks.20/self_attn/Gather_13_output_0 onnx::Unsqueeze_6403*/blocks.20/self_attn/Unsqueeze_29_output_0!/blocks.20/self_attn/Unsqueeze_29" Unsqueeze  */blocks.20/self_attn/Unsqueeze_26_output_0 */blocks.20/self_attn/Unsqueeze_27_output_0 */blocks.20/self_attn/Unsqueeze_28_output_0 */blocks.20/self_attn/Unsqueeze_29_output_0'/blocks.20/self_attn/Concat_11_output_0/blocks.20/self_attn/Concat_11"Concat* axis  &/blocks.20/self_attn/Expand_1_output_0 '/blocks.20/self_attn/Concat_11_output_0'/blocks.20/self_attn/Reshape_6_output_0/blocks.20/self_attn/Reshape_6"Reshape* allowzero  '/blocks.20/self_attn/Transpose_output_0 '/blocks.20/self_attn/Reshape_4_output_0$/blocks.20/self_attn/MatMul_output_0/blocks.20/self_attn/MatMul"MatMul )/blocks.20/self_attn/Constant_56_output_0 /blocks.20/self_attn/Constant_56"Constant*B value*6B,/blocks.20/self_attn/Constant_56_attr::valueJ5A  $/blocks.20/self_attn/MatMul_output_0 )/blocks.20/self_attn/Constant_56_output_0#/blocks.20/self_attn/Div_2_output_0/blocks.20/self_attn/Div_2"Div { #/blocks.20/self_attn/Div_2_output_0 attention_mask#/blocks.20/self_attn/Add_2_output_0/blocks.20/self_attn/Add_2"Add  #/blocks.20/self_attn/Add_2_output_0%/blocks.20/self_attn/Softmax_output_0/blocks.20/self_attn/Softmax"Softmax* axis { %/blocks.20/self_attn/Softmax_output_0$/blocks.20/self_attn/Cast_4_output_0/blocks.20/self_attn/Cast_4"Cast* to  $/blocks.20/self_attn/Cast_4_output_0 '/blocks.20/self_attn/Reshape_6_output_0&/blocks.20/self_attn/MatMul_1_output_0/blocks.20/self_attn/MatMul_1"MatMul  &/blocks.20/self_attn/MatMul_1_output_0)/blocks.20/self_attn/Transpose_3_output_0 /blocks.20/self_attn/Transpose_3" Transpose* perm@@@@ fonnx::Unsqueeze_6415 Constant_8017"Constant*5 value*)BConstant_8017_attr::valueJ  $/blocks.20/self_attn/Gather_output_0 onnx::Unsqueeze_6415*/blocks.20/self_attn/Unsqueeze_30_output_0!/blocks.20/self_attn/Unsqueeze_30" Unsqueeze fonnx::Unsqueeze_6417 Constant_8019"Constant*5 value*)BConstant_8019_attr::valueJ  &/blocks.20/self_attn/Gather_1_output_0 onnx::Unsqueeze_6417*/blocks.20/self_attn/Unsqueeze_31_output_0!/blocks.20/self_attn/Unsqueeze_31" Unsqueeze )/blocks.20/self_attn/Constant_57_output_0 /blocks.20/self_attn/Constant_57"Constant*H value*<B,/blocks.20/self_attn/Constant_57_attr::valueJ  */blocks.20/self_attn/Unsqueeze_30_output_0 */blocks.20/self_attn/Unsqueeze_31_output_0 )/blocks.20/self_attn/Constant_57_output_0'/blocks.20/self_attn/Concat_12_output_0/blocks.20/self_attn/Concat_12"Concat* axis  )/blocks.20/self_attn/Transpose_3_output_0 '/blocks.20/self_attn/Concat_12_output_0'/blocks.20/self_attn/Reshape_7_output_0/blocks.20/self_attn/Reshape_7"Reshape* allowzero  '/blocks.20/self_attn/Reshape_7_output_0 onnx::MatMul_9149+/blocks.20/self_attn/o_proj/MatMul_output_0"/blocks.20/self_attn/o_proj/MatMul"MatMul  */blocks.20/input_layernorm/Cast_1_output_0 +/blocks.20/self_attn/o_proj/MatMul_output_0/blocks.20/Add_output_0/blocks.20/Add"Add  /blocks.20/Add_output_01/blocks.20/post_attention_layernorm/Cast_output_0(/blocks.20/post_attention_layernorm/Cast"Cast* to 5/blocks.20/post_attention_layernorm/Constant_output_0,/blocks.20/post_attention_layernorm/Constant"Constant*N value*BB8/blocks.20/post_attention_layernorm/Constant_attr::valueJ@  1/blocks.20/post_attention_layernorm/Cast_output_0 5/blocks.20/post_attention_layernorm/Constant_output_00/blocks.20/post_attention_layernorm/Pow_output_0'/blocks.20/post_attention_layernorm/Pow"Pow  0/blocks.20/post_attention_layernorm/Pow_output_07/blocks.20/post_attention_layernorm/ReduceMean_output_0./blocks.20/post_attention_layernorm/ReduceMean" ReduceMean* axes@* keepdims 7/blocks.20/post_attention_layernorm/Constant_1_output_0./blocks.20/post_attention_layernorm/Constant_1"Constant*P value*DB:/blocks.20/post_attention_layernorm/Constant_1_attr::valueJ75  7/blocks.20/post_attention_layernorm/ReduceMean_output_0 7/blocks.20/post_attention_layernorm/Constant_1_output_00/blocks.20/post_attention_layernorm/Add_output_0'/blocks.20/post_attention_layernorm/Add"Add  0/blocks.20/post_attention_layernorm/Add_output_01/blocks.20/post_attention_layernorm/Sqrt_output_0(/blocks.20/post_attention_layernorm/Sqrt"Sqrt 7/blocks.20/post_attention_layernorm/Constant_2_output_0./blocks.20/post_attention_layernorm/Constant_2"Constant*P value*DB:/blocks.20/post_attention_layernorm/Constant_2_attr::valueJ?  7/blocks.20/post_attention_layernorm/Constant_2_output_0 1/blocks.20/post_attention_layernorm/Sqrt_output_00/blocks.20/post_attention_layernorm/Div_output_0'/blocks.20/post_attention_layernorm/Div"Div  1/blocks.20/post_attention_layernorm/Cast_output_03/blocks.20/post_attention_layernorm/Cast_1_output_0*/blocks.20/post_attention_layernorm/Cast_1"Cast* to  3/blocks.20/post_attention_layernorm/Cast_1_output_0 0/blocks.20/post_attention_layernorm/Div_output_00/blocks.20/post_attention_layernorm/Mul_output_0'/blocks.20/post_attention_layernorm/Mul"Mul  0/blocks.20/post_attention_layernorm/Mul_output_0 )blocks.20.post_attention_layernorm.weight2/blocks.20/post_attention_layernorm/Mul_1_output_0)/blocks.20/post_attention_layernorm/Mul_1"Mul  2/blocks.20/post_attention_layernorm/Mul_1_output_03/blocks.20/post_attention_layernorm/Cast_2_output_0*/blocks.20/post_attention_layernorm/Cast_2"Cast* to  3/blocks.20/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_9150(/blocks.20/mlp/gate_proj/MatMul_output_0/blocks.20/mlp/gate_proj/MatMul"MatMul z (/blocks.20/mlp/gate_proj/MatMul_output_0&/blocks.20/mlp/act_fn/Sigmoid_output_0/blocks.20/mlp/act_fn/Sigmoid"Sigmoid  (/blocks.20/mlp/gate_proj/MatMul_output_0 &/blocks.20/mlp/act_fn/Sigmoid_output_0"/blocks.20/mlp/act_fn/Mul_output_0/blocks.20/mlp/act_fn/Mul"Mul  3/blocks.20/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_9151&/blocks.20/mlp/up_proj/MatMul_output_0/blocks.20/mlp/up_proj/MatMul"MatMul  "/blocks.20/mlp/act_fn/Mul_output_0 &/blocks.20/mlp/up_proj/MatMul_output_0/blocks.20/mlp/Mul_output_0/blocks.20/mlp/Mul"Mul  /blocks.20/mlp/Mul_output_0 onnx::MatMul_9152(/blocks.20/mlp/down_proj/MatMul_output_0/blocks.20/mlp/down_proj/MatMul"MatMul  3/blocks.20/post_attention_layernorm/Cast_1_output_0 (/blocks.20/mlp/down_proj/MatMul_output_0/blocks.20/Add_1_output_0/blocks.20/Add_1"Add c/Constant_13_output_0 /Constant_13"Constant*2 value*&B/Constant_13_attr::valueJ ^ past_key_values /Constant_13_output_0/Gather_21_output_0 /Gather_21"Gather* axis /blocks.21/Constant_output_0/blocks.21/Constant"Constant*K value*?B/blocks.21/Constant_attr::valueJ  /blocks.20/Add_1_output_0 /blocks.21/Constant_output_0/blocks.21/Reshape_output_0/blocks.21/Reshape"Reshape* allowzero y /blocks.21/Reshape_output_0(/blocks.21/input_layernorm/Cast_output_0/blocks.21/input_layernorm/Cast"Cast* to ,/blocks.21/input_layernorm/Constant_output_0#/blocks.21/input_layernorm/Constant"Constant*E value*9B//blocks.21/input_layernorm/Constant_attr::valueJ@  (/blocks.21/input_layernorm/Cast_output_0 ,/blocks.21/input_layernorm/Constant_output_0'/blocks.21/input_layernorm/Pow_output_0/blocks.21/input_layernorm/Pow"Pow  '/blocks.21/input_layernorm/Pow_output_0./blocks.21/input_layernorm/ReduceMean_output_0%/blocks.21/input_layernorm/ReduceMean" ReduceMean* axes@* keepdims ./blocks.21/input_layernorm/Constant_1_output_0%/blocks.21/input_layernorm/Constant_1"Constant*G value*;B1/blocks.21/input_layernorm/Constant_1_attr::valueJ75  ./blocks.21/input_layernorm/ReduceMean_output_0 ./blocks.21/input_layernorm/Constant_1_output_0'/blocks.21/input_layernorm/Add_output_0/blocks.21/input_layernorm/Add"Add z '/blocks.21/input_layernorm/Add_output_0(/blocks.21/input_layernorm/Sqrt_output_0/blocks.21/input_layernorm/Sqrt"Sqrt ./blocks.21/input_layernorm/Constant_2_output_0%/blocks.21/input_layernorm/Constant_2"Constant*G value*;B1/blocks.21/input_layernorm/Constant_2_attr::valueJ?  ./blocks.21/input_layernorm/Constant_2_output_0 (/blocks.21/input_layernorm/Sqrt_output_0'/blocks.21/input_layernorm/Div_output_0/blocks.21/input_layernorm/Div"Div  (/blocks.21/input_layernorm/Cast_output_0*/blocks.21/input_layernorm/Cast_1_output_0!/blocks.21/input_layernorm/Cast_1"Cast* to  */blocks.21/input_layernorm/Cast_1_output_0 '/blocks.21/input_layernorm/Div_output_0'/blocks.21/input_layernorm/Mul_output_0/blocks.21/input_layernorm/Mul"Mul  '/blocks.21/input_layernorm/Mul_output_0 blocks.21.input_layernorm.weight)/blocks.21/input_layernorm/Mul_1_output_0 /blocks.21/input_layernorm/Mul_1"Mul  )/blocks.21/input_layernorm/Mul_1_output_0*/blocks.21/input_layernorm/Cast_2_output_0!/blocks.21/input_layernorm/Cast_2"Cast* to t */blocks.21/input_layernorm/Cast_2_output_0#/blocks.21/self_attn/Shape_output_0/blocks.21/self_attn/Shape"Shape &/blocks.21/self_attn/Constant_output_0/blocks.21/self_attn/Constant"Constant*C value*7B)/blocks.21/self_attn/Constant_attr::valueJ  #/blocks.21/self_attn/Shape_output_0 &/blocks.21/self_attn/Constant_output_0$/blocks.21/self_attn/Gather_output_0/blocks.21/self_attn/Gather"Gather* axis x */blocks.21/input_layernorm/Cast_2_output_0%/blocks.21/self_attn/Shape_1_output_0/blocks.21/self_attn/Shape_1"Shape (/blocks.21/self_attn/Constant_1_output_0/blocks.21/self_attn/Constant_1"Constant*E value*9B+/blocks.21/self_attn/Constant_1_attr::valueJ  %/blocks.21/self_attn/Shape_1_output_0 (/blocks.21/self_attn/Constant_1_output_0&/blocks.21/self_attn/Gather_1_output_0/blocks.21/self_attn/Gather_1"Gather* axis  */blocks.21/input_layernorm/Cast_2_output_0 onnx::MatMul_9153+/blocks.21/self_attn/q_proj/MatMul_output_0"/blocks.21/self_attn/q_proj/MatMul"MatMul  */blocks.21/input_layernorm/Cast_2_output_0 onnx::MatMul_9154+/blocks.21/self_attn/k_proj/MatMul_output_0"/blocks.21/self_attn/k_proj/MatMul"MatMul  */blocks.21/input_layernorm/Cast_2_output_0 onnx::MatMul_9155+/blocks.21/self_attn/v_proj/MatMul_output_0"/blocks.21/self_attn/v_proj/MatMul"MatMul fonnx::Unsqueeze_6478 Constant_8072"Constant*5 value*)BConstant_8072_attr::valueJ  $/blocks.21/self_attn/Gather_output_0 onnx::Unsqueeze_6478'/blocks.21/self_attn/Unsqueeze_output_0/blocks.21/self_attn/Unsqueeze" Unsqueeze fonnx::Unsqueeze_6480 Constant_8074"Constant*5 value*)BConstant_8074_attr::valueJ  &/blocks.21/self_attn/Gather_1_output_0 onnx::Unsqueeze_6480)/blocks.21/self_attn/Unsqueeze_1_output_0 /blocks.21/self_attn/Unsqueeze_1" Unsqueeze (/blocks.21/self_attn/Constant_2_output_0/blocks.21/self_attn/Constant_2"Constant*G value*;B+/blocks.21/self_attn/Constant_2_attr::valueJ (/blocks.21/self_attn/Constant_3_output_0/blocks.21/self_attn/Constant_3"Constant*G value*;B+/blocks.21/self_attn/Constant_3_attr::valueJ  '/blocks.21/self_attn/Unsqueeze_output_0 )/blocks.21/self_attn/Unsqueeze_1_output_0 (/blocks.21/self_attn/Constant_2_output_0 (/blocks.21/self_attn/Constant_3_output_0$/blocks.21/self_attn/Concat_output_0/blocks.21/self_attn/Concat"Concat* axis  +/blocks.21/self_attn/q_proj/MatMul_output_0 $/blocks.21/self_attn/Concat_output_0%/blocks.21/self_attn/Reshape_output_0/blocks.21/self_attn/Reshape"Reshape* allowzero fonnx::Unsqueeze_6488 Constant_8080"Constant*5 value*)BConstant_8080_attr::valueJ  $/blocks.21/self_attn/Gather_output_0 onnx::Unsqueeze_6488)/blocks.21/self_attn/Unsqueeze_2_output_0 /blocks.21/self_attn/Unsqueeze_2" Unsqueeze fonnx::Unsqueeze_6490 Constant_8082"Constant*5 value*)BConstant_8082_attr::valueJ  &/blocks.21/self_attn/Gather_1_output_0 onnx::Unsqueeze_6490)/blocks.21/self_attn/Unsqueeze_3_output_0 /blocks.21/self_attn/Unsqueeze_3" Unsqueeze (/blocks.21/self_attn/Constant_4_output_0/blocks.21/self_attn/Constant_4"Constant*G value*;B+/blocks.21/self_attn/Constant_4_attr::valueJ (/blocks.21/self_attn/Constant_5_output_0/blocks.21/self_attn/Constant_5"Constant*G value*;B+/blocks.21/self_attn/Constant_5_attr::valueJ  )/blocks.21/self_attn/Unsqueeze_2_output_0 )/blocks.21/self_attn/Unsqueeze_3_output_0 (/blocks.21/self_attn/Constant_4_output_0 (/blocks.21/self_attn/Constant_5_output_0&/blocks.21/self_attn/Concat_1_output_0/blocks.21/self_attn/Concat_1"Concat* axis fonnx::Unsqueeze_6497 Constant_8087"Constant*5 value*)BConstant_8087_attr::valueJ  $/blocks.21/self_attn/Gather_output_0 onnx::Unsqueeze_6497)/blocks.21/self_attn/Unsqueeze_4_output_0 /blocks.21/self_attn/Unsqueeze_4" Unsqueeze fonnx::Unsqueeze_6499 Constant_8089"Constant*5 value*)BConstant_8089_attr::valueJ  &/blocks.21/self_attn/Gather_1_output_0 onnx::Unsqueeze_6499)/blocks.21/self_attn/Unsqueeze_5_output_0 /blocks.21/self_attn/Unsqueeze_5" Unsqueeze (/blocks.21/self_attn/Constant_6_output_0/blocks.21/self_attn/Constant_6"Constant*G value*;B+/blocks.21/self_attn/Constant_6_attr::valueJ (/blocks.21/self_attn/Constant_7_output_0/blocks.21/self_attn/Constant_7"Constant*G value*;B+/blocks.21/self_attn/Constant_7_attr::valueJ  )/blocks.21/self_attn/Unsqueeze_4_output_0 )/blocks.21/self_attn/Unsqueeze_5_output_0 (/blocks.21/self_attn/Constant_6_output_0 (/blocks.21/self_attn/Constant_7_output_0&/blocks.21/self_attn/Concat_2_output_0/blocks.21/self_attn/Concat_2"Concat* axis  +/blocks.21/self_attn/k_proj/MatMul_output_0 &/blocks.21/self_attn/Concat_1_output_0'/blocks.21/self_attn/Reshape_1_output_0/blocks.21/self_attn/Reshape_1"Reshape* allowzero  +/blocks.21/self_attn/v_proj/MatMul_output_0 &/blocks.21/self_attn/Concat_2_output_0'/blocks.21/self_attn/Reshape_2_output_0/blocks.21/self_attn/Reshape_2"Reshape* allowzero  %/blocks.21/self_attn/Reshape_output_0)/blocks.21/self_attn/q_norm/Cast_output_0 /blocks.21/self_attn/q_norm/Cast"Cast* to -/blocks.21/self_attn/q_norm/Constant_output_0$/blocks.21/self_attn/q_norm/Constant"Constant*F value*:B0/blocks.21/self_attn/q_norm/Constant_attr::valueJ@  )/blocks.21/self_attn/q_norm/Cast_output_0 -/blocks.21/self_attn/q_norm/Constant_output_0(/blocks.21/self_attn/q_norm/Pow_output_0/blocks.21/self_attn/q_norm/Pow"Pow  (/blocks.21/self_attn/q_norm/Pow_output_0//blocks.21/self_attn/q_norm/ReduceMean_output_0&/blocks.21/self_attn/q_norm/ReduceMean" ReduceMean* axes@* keepdims //blocks.21/self_attn/q_norm/Constant_1_output_0&/blocks.21/self_attn/q_norm/Constant_1"Constant*H value*<B2/blocks.21/self_attn/q_norm/Constant_1_attr::valueJ75  //blocks.21/self_attn/q_norm/ReduceMean_output_0 //blocks.21/self_attn/q_norm/Constant_1_output_0(/blocks.21/self_attn/q_norm/Add_output_0/blocks.21/self_attn/q_norm/Add"Add } (/blocks.21/self_attn/q_norm/Add_output_0)/blocks.21/self_attn/q_norm/Sqrt_output_0 /blocks.21/self_attn/q_norm/Sqrt"Sqrt //blocks.21/self_attn/q_norm/Constant_2_output_0&/blocks.21/self_attn/q_norm/Constant_2"Constant*H value*<B2/blocks.21/self_attn/q_norm/Constant_2_attr::valueJ?  //blocks.21/self_attn/q_norm/Constant_2_output_0 )/blocks.21/self_attn/q_norm/Sqrt_output_0(/blocks.21/self_attn/q_norm/Div_output_0/blocks.21/self_attn/q_norm/Div"Div  )/blocks.21/self_attn/q_norm/Cast_output_0+/blocks.21/self_attn/q_norm/Cast_1_output_0"/blocks.21/self_attn/q_norm/Cast_1"Cast* to  +/blocks.21/self_attn/q_norm/Cast_1_output_0 (/blocks.21/self_attn/q_norm/Div_output_0(/blocks.21/self_attn/q_norm/Mul_output_0/blocks.21/self_attn/q_norm/Mul"Mul  (/blocks.21/self_attn/q_norm/Mul_output_0 !blocks.21.self_attn.q_norm.weight*/blocks.21/self_attn/q_norm/Mul_1_output_0!/blocks.21/self_attn/q_norm/Mul_1"Mul  */blocks.21/self_attn/q_norm/Mul_1_output_0+/blocks.21/self_attn/q_norm/Cast_2_output_0"/blocks.21/self_attn/q_norm/Cast_2"Cast* to  '/blocks.21/self_attn/Reshape_1_output_0)/blocks.21/self_attn/k_norm/Cast_output_0 /blocks.21/self_attn/k_norm/Cast"Cast* to -/blocks.21/self_attn/k_norm/Constant_output_0$/blocks.21/self_attn/k_norm/Constant"Constant*F value*:B0/blocks.21/self_attn/k_norm/Constant_attr::valueJ@  )/blocks.21/self_attn/k_norm/Cast_output_0 -/blocks.21/self_attn/k_norm/Constant_output_0(/blocks.21/self_attn/k_norm/Pow_output_0/blocks.21/self_attn/k_norm/Pow"Pow  (/blocks.21/self_attn/k_norm/Pow_output_0//blocks.21/self_attn/k_norm/ReduceMean_output_0&/blocks.21/self_attn/k_norm/ReduceMean" ReduceMean* axes@* keepdims //blocks.21/self_attn/k_norm/Constant_1_output_0&/blocks.21/self_attn/k_norm/Constant_1"Constant*H value*<B2/blocks.21/self_attn/k_norm/Constant_1_attr::valueJ75  //blocks.21/self_attn/k_norm/ReduceMean_output_0 //blocks.21/self_attn/k_norm/Constant_1_output_0(/blocks.21/self_attn/k_norm/Add_output_0/blocks.21/self_attn/k_norm/Add"Add } (/blocks.21/self_attn/k_norm/Add_output_0)/blocks.21/self_attn/k_norm/Sqrt_output_0 /blocks.21/self_attn/k_norm/Sqrt"Sqrt //blocks.21/self_attn/k_norm/Constant_2_output_0&/blocks.21/self_attn/k_norm/Constant_2"Constant*H value*<B2/blocks.21/self_attn/k_norm/Constant_2_attr::valueJ?  //blocks.21/self_attn/k_norm/Constant_2_output_0 )/blocks.21/self_attn/k_norm/Sqrt_output_0(/blocks.21/self_attn/k_norm/Div_output_0/blocks.21/self_attn/k_norm/Div"Div  )/blocks.21/self_attn/k_norm/Cast_output_0+/blocks.21/self_attn/k_norm/Cast_1_output_0"/blocks.21/self_attn/k_norm/Cast_1"Cast* to  +/blocks.21/self_attn/k_norm/Cast_1_output_0 (/blocks.21/self_attn/k_norm/Div_output_0(/blocks.21/self_attn/k_norm/Mul_output_0/blocks.21/self_attn/k_norm/Mul"Mul  (/blocks.21/self_attn/k_norm/Mul_output_0 !blocks.21.self_attn.k_norm.weight*/blocks.21/self_attn/k_norm/Mul_1_output_0!/blocks.21/self_attn/k_norm/Mul_1"Mul  */blocks.21/self_attn/k_norm/Mul_1_output_0+/blocks.21/self_attn/k_norm/Cast_2_output_0"/blocks.21/self_attn/k_norm/Cast_2"Cast* to  +/blocks.21/self_attn/q_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0!/blocks.21/self_attn/Mul_output_0/blocks.21/self_attn/Mul"Mul y +/blocks.21/self_attn/q_norm/Cast_2_output_0%/blocks.21/self_attn/Shape_2_output_0/blocks.21/self_attn/Shape_2"Shape (/blocks.21/self_attn/Constant_8_output_0/blocks.21/self_attn/Constant_8"Constant*E value*9B+/blocks.21/self_attn/Constant_8_attr::valueJ  %/blocks.21/self_attn/Shape_2_output_0 (/blocks.21/self_attn/Constant_8_output_0&/blocks.21/self_attn/Gather_2_output_0/blocks.21/self_attn/Gather_2"Gather* axis (/blocks.21/self_attn/Constant_9_output_0/blocks.21/self_attn/Constant_9"Constant*E value*9B+/blocks.21/self_attn/Constant_9_attr::valueJ  &/blocks.21/self_attn/Gather_2_output_0 (/blocks.21/self_attn/Constant_9_output_0!/blocks.21/self_attn/Div_output_0/blocks.21/self_attn/Div"Div s !/blocks.21/self_attn/Div_output_0"/blocks.21/self_attn/Cast_output_0/blocks.21/self_attn/Cast"Cast* to x "/blocks.21/self_attn/Cast_output_0$/blocks.21/self_attn/Cast_1_output_0/blocks.21/self_attn/Cast_1"Cast* to )/blocks.21/self_attn/Constant_10_output_0 /blocks.21/self_attn/Constant_10"Constant*H value*<B,/blocks.21/self_attn/Constant_10_attr::valueJ )/blocks.21/self_attn/Constant_11_output_0 /blocks.21/self_attn/Constant_11"Constant*H value*<B,/blocks.21/self_attn/Constant_11_attr::valueJ )/blocks.21/self_attn/Constant_12_output_0 /blocks.21/self_attn/Constant_12"Constant*H value*<B,/blocks.21/self_attn/Constant_12_attr::valueJ  $/blocks.21/self_attn/Cast_1_output_0 )/blocks.21/self_attn/Constant_12_output_0)/blocks.21/self_attn/Unsqueeze_6_output_0 /blocks.21/self_attn/Unsqueeze_6" Unsqueeze )/blocks.21/self_attn/Constant_13_output_0 /blocks.21/self_attn/Constant_13"Constant*H value*<B,/blocks.21/self_attn/Constant_13_attr::valueJ  +/blocks.21/self_attn/q_norm/Cast_2_output_0 )/blocks.21/self_attn/Constant_11_output_0 )/blocks.21/self_attn/Unsqueeze_6_output_0 )/blocks.21/self_attn/Constant_10_output_0 )/blocks.21/self_attn/Constant_13_output_0#/blocks.21/self_attn/Slice_output_0/blocks.21/self_attn/Slice"Slice )/blocks.21/self_attn/Constant_14_output_0 /blocks.21/self_attn/Constant_14"Constant*H value*<B,/blocks.21/self_attn/Constant_14_attr::valueJ )/blocks.21/self_attn/Constant_15_output_0 /blocks.21/self_attn/Constant_15"Constant*H value*<B,/blocks.21/self_attn/Constant_15_attr::valueJ  $/blocks.21/self_attn/Cast_1_output_0 )/blocks.21/self_attn/Constant_15_output_0)/blocks.21/self_attn/Unsqueeze_7_output_0 /blocks.21/self_attn/Unsqueeze_7" Unsqueeze )/blocks.21/self_attn/Constant_16_output_0 /blocks.21/self_attn/Constant_16"Constant*H value*<B,/blocks.21/self_attn/Constant_16_attr::valueJ )/blocks.21/self_attn/Constant_17_output_0 /blocks.21/self_attn/Constant_17"Constant*H value*<B,/blocks.21/self_attn/Constant_17_attr::valueJ  +/blocks.21/self_attn/q_norm/Cast_2_output_0 )/blocks.21/self_attn/Unsqueeze_7_output_0 )/blocks.21/self_attn/Constant_16_output_0 )/blocks.21/self_attn/Constant_14_output_0 )/blocks.21/self_attn/Constant_17_output_0%/blocks.21/self_attn/Slice_1_output_0/blocks.21/self_attn/Slice_1"Slice i %/blocks.21/self_attn/Slice_1_output_0!/blocks.21/self_attn/Neg_output_0/blocks.21/self_attn/Neg"Neg  !/blocks.21/self_attn/Neg_output_0 #/blocks.21/self_attn/Slice_output_0&/blocks.21/self_attn/Concat_3_output_0/blocks.21/self_attn/Concat_3"Concat* axis  &/blocks.21/self_attn/Concat_3_output_0 %/blocks.0/self_attn/Gather_3_output_0#/blocks.21/self_attn/Mul_1_output_0/blocks.21/self_attn/Mul_1"Mul  !/blocks.21/self_attn/Mul_output_0 #/blocks.21/self_attn/Mul_1_output_0!/blocks.21/self_attn/Add_output_0/blocks.21/self_attn/Add"Add  +/blocks.21/self_attn/k_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0#/blocks.21/self_attn/Mul_2_output_0/blocks.21/self_attn/Mul_2"Mul y +/blocks.21/self_attn/k_norm/Cast_2_output_0%/blocks.21/self_attn/Shape_3_output_0/blocks.21/self_attn/Shape_3"Shape )/blocks.21/self_attn/Constant_18_output_0 /blocks.21/self_attn/Constant_18"Constant*F value*:B,/blocks.21/self_attn/Constant_18_attr::valueJ  %/blocks.21/self_attn/Shape_3_output_0 )/blocks.21/self_attn/Constant_18_output_0&/blocks.21/self_attn/Gather_3_output_0/blocks.21/self_attn/Gather_3"Gather* axis )/blocks.21/self_attn/Constant_19_output_0 /blocks.21/self_attn/Constant_19"Constant*F value*:B,/blocks.21/self_attn/Constant_19_attr::valueJ  &/blocks.21/self_attn/Gather_3_output_0 )/blocks.21/self_attn/Constant_19_output_0#/blocks.21/self_attn/Div_1_output_0/blocks.21/self_attn/Div_1"Div y #/blocks.21/self_attn/Div_1_output_0$/blocks.21/self_attn/Cast_2_output_0/blocks.21/self_attn/Cast_2"Cast* to z $/blocks.21/self_attn/Cast_2_output_0$/blocks.21/self_attn/Cast_3_output_0/blocks.21/self_attn/Cast_3"Cast* to )/blocks.21/self_attn/Constant_20_output_0 /blocks.21/self_attn/Constant_20"Constant*H value*<B,/blocks.21/self_attn/Constant_20_attr::valueJ )/blocks.21/self_attn/Constant_21_output_0 /blocks.21/self_attn/Constant_21"Constant*H value*<B,/blocks.21/self_attn/Constant_21_attr::valueJ )/blocks.21/self_attn/Constant_22_output_0 /blocks.21/self_attn/Constant_22"Constant*H value*<B,/blocks.21/self_attn/Constant_22_attr::valueJ  $/blocks.21/self_attn/Cast_3_output_0 )/blocks.21/self_attn/Constant_22_output_0)/blocks.21/self_attn/Unsqueeze_8_output_0 /blocks.21/self_attn/Unsqueeze_8" Unsqueeze )/blocks.21/self_attn/Constant_23_output_0 /blocks.21/self_attn/Constant_23"Constant*H value*<B,/blocks.21/self_attn/Constant_23_attr::valueJ  +/blocks.21/self_attn/k_norm/Cast_2_output_0 )/blocks.21/self_attn/Constant_21_output_0 )/blocks.21/self_attn/Unsqueeze_8_output_0 )/blocks.21/self_attn/Constant_20_output_0 )/blocks.21/self_attn/Constant_23_output_0%/blocks.21/self_attn/Slice_2_output_0/blocks.21/self_attn/Slice_2"Slice )/blocks.21/self_attn/Constant_24_output_0 /blocks.21/self_attn/Constant_24"Constant*H value*<B,/blocks.21/self_attn/Constant_24_attr::valueJ )/blocks.21/self_attn/Constant_25_output_0 /blocks.21/self_attn/Constant_25"Constant*H value*<B,/blocks.21/self_attn/Constant_25_attr::valueJ  $/blocks.21/self_attn/Cast_3_output_0 )/blocks.21/self_attn/Constant_25_output_0)/blocks.21/self_attn/Unsqueeze_9_output_0 /blocks.21/self_attn/Unsqueeze_9" Unsqueeze )/blocks.21/self_attn/Constant_26_output_0 /blocks.21/self_attn/Constant_26"Constant*H value*<B,/blocks.21/self_attn/Constant_26_attr::valueJ )/blocks.21/self_attn/Constant_27_output_0 /blocks.21/self_attn/Constant_27"Constant*H value*<B,/blocks.21/self_attn/Constant_27_attr::valueJ  +/blocks.21/self_attn/k_norm/Cast_2_output_0 )/blocks.21/self_attn/Unsqueeze_9_output_0 )/blocks.21/self_attn/Constant_26_output_0 )/blocks.21/self_attn/Constant_24_output_0 )/blocks.21/self_attn/Constant_27_output_0%/blocks.21/self_attn/Slice_3_output_0/blocks.21/self_attn/Slice_3"Slice m %/blocks.21/self_attn/Slice_3_output_0#/blocks.21/self_attn/Neg_1_output_0/blocks.21/self_attn/Neg_1"Neg  #/blocks.21/self_attn/Neg_1_output_0 %/blocks.21/self_attn/Slice_2_output_0&/blocks.21/self_attn/Concat_4_output_0/blocks.21/self_attn/Concat_4"Concat* axis  &/blocks.21/self_attn/Concat_4_output_0 %/blocks.0/self_attn/Gather_3_output_0#/blocks.21/self_attn/Mul_3_output_0/blocks.21/self_attn/Mul_3"Mul  #/blocks.21/self_attn/Mul_2_output_0 #/blocks.21/self_attn/Mul_3_output_0#/blocks.21/self_attn/Add_1_output_0/blocks.21/self_attn/Add_1"Add  /Gather_21_output_0 /rotary/Constant_3_output_0&/blocks.21/self_attn/Gather_4_output_0/blocks.21/self_attn/Gather_4"Gather* axis  /Gather_21_output_0 /rotary/Constant_8_output_0&/blocks.21/self_attn/Gather_5_output_0/blocks.21/self_attn/Gather_5"Gather* axis  &/blocks.21/self_attn/Gather_4_output_0 #/blocks.21/self_attn/Add_1_output_0&/blocks.21/self_attn/Concat_5_output_0/blocks.21/self_attn/Concat_5"Concat* axis  &/blocks.21/self_attn/Gather_5_output_0 '/blocks.21/self_attn/Reshape_2_output_0&/blocks.21/self_attn/Concat_6_output_0/blocks.21/self_attn/Concat_6"Concat* axis )/blocks.21/self_attn/Constant_28_output_0 /blocks.21/self_attn/Constant_28"Constant*H value*<B,/blocks.21/self_attn/Constant_28_attr::valueJ  &/blocks.21/self_attn/Concat_5_output_0 )/blocks.21/self_attn/Constant_28_output_0*/blocks.21/self_attn/Unsqueeze_10_output_0!/blocks.21/self_attn/Unsqueeze_10" Unsqueeze )/blocks.21/self_attn/Constant_29_output_0 /blocks.21/self_attn/Constant_29"Constant*H value*<B,/blocks.21/self_attn/Constant_29_attr::valueJ  &/blocks.21/self_attn/Concat_6_output_0 )/blocks.21/self_attn/Constant_29_output_0*/blocks.21/self_attn/Unsqueeze_11_output_0!/blocks.21/self_attn/Unsqueeze_11" Unsqueeze  */blocks.21/self_attn/Unsqueeze_10_output_0 */blocks.21/self_attn/Unsqueeze_11_output_0&/blocks.21/self_attn/Concat_7_output_0/blocks.21/self_attn/Concat_7"Concat* axis  !/blocks.21/self_attn/Add_output_0'/blocks.21/self_attn/Transpose_output_0/blocks.21/self_attn/Transpose" Transpose* perm@@@@  &/blocks.21/self_attn/Concat_5_output_0)/blocks.21/self_attn/Transpose_1_output_0 /blocks.21/self_attn/Transpose_1" Transpose* perm@@@@  &/blocks.21/self_attn/Concat_6_output_0)/blocks.21/self_attn/Transpose_2_output_0 /blocks.21/self_attn/Transpose_2" Transpose* perm@@@@ w )/blocks.21/self_attn/Transpose_1_output_0%/blocks.21/self_attn/Shape_4_output_0/blocks.21/self_attn/Shape_4"Shape )/blocks.21/self_attn/Constant_30_output_0 /blocks.21/self_attn/Constant_30"Constant*F value*:B,/blocks.21/self_attn/Constant_30_attr::valueJ  %/blocks.21/self_attn/Shape_4_output_0 )/blocks.21/self_attn/Constant_30_output_0&/blocks.21/self_attn/Gather_6_output_0/blocks.21/self_attn/Gather_6"Gather* axis w )/blocks.21/self_attn/Transpose_1_output_0%/blocks.21/self_attn/Shape_5_output_0/blocks.21/self_attn/Shape_5"Shape )/blocks.21/self_attn/Constant_31_output_0 /blocks.21/self_attn/Constant_31"Constant*F value*:B,/blocks.21/self_attn/Constant_31_attr::valueJ  %/blocks.21/self_attn/Shape_5_output_0 )/blocks.21/self_attn/Constant_31_output_0&/blocks.21/self_attn/Gather_7_output_0/blocks.21/self_attn/Gather_7"Gather* axis w )/blocks.21/self_attn/Transpose_1_output_0%/blocks.21/self_attn/Shape_6_output_0/blocks.21/self_attn/Shape_6"Shape )/blocks.21/self_attn/Constant_32_output_0 /blocks.21/self_attn/Constant_32"Constant*F value*:B,/blocks.21/self_attn/Constant_32_attr::valueJ  %/blocks.21/self_attn/Shape_6_output_0 )/blocks.21/self_attn/Constant_32_output_0&/blocks.21/self_attn/Gather_8_output_0/blocks.21/self_attn/Gather_8"Gather* axis w )/blocks.21/self_attn/Transpose_1_output_0%/blocks.21/self_attn/Shape_7_output_0/blocks.21/self_attn/Shape_7"Shape )/blocks.21/self_attn/Constant_33_output_0 /blocks.21/self_attn/Constant_33"Constant*F value*:B,/blocks.21/self_attn/Constant_33_attr::valueJ  %/blocks.21/self_attn/Shape_7_output_0 )/blocks.21/self_attn/Constant_33_output_0&/blocks.21/self_attn/Gather_9_output_0/blocks.21/self_attn/Gather_9"Gather* axis )/blocks.21/self_attn/Constant_34_output_0 /blocks.21/self_attn/Constant_34"Constant*H value*<B,/blocks.21/self_attn/Constant_34_attr::valueJ  )/blocks.21/self_attn/Transpose_1_output_0 )/blocks.21/self_attn/Constant_34_output_0*/blocks.21/self_attn/Unsqueeze_12_output_0!/blocks.21/self_attn/Unsqueeze_12" Unsqueeze )/blocks.21/self_attn/Constant_35_output_0 /blocks.21/self_attn/Constant_35"Constant*H value*<B,/blocks.21/self_attn/Constant_35_attr::valueJ  &/blocks.21/self_attn/Gather_6_output_0 )/blocks.21/self_attn/Constant_35_output_0*/blocks.21/self_attn/Unsqueeze_13_output_0!/blocks.21/self_attn/Unsqueeze_13" Unsqueeze )/blocks.21/self_attn/Constant_36_output_0 /blocks.21/self_attn/Constant_36"Constant*H value*<B,/blocks.21/self_attn/Constant_36_attr::valueJ  &/blocks.21/self_attn/Gather_7_output_0 )/blocks.21/self_attn/Constant_36_output_0*/blocks.21/self_attn/Unsqueeze_14_output_0!/blocks.21/self_attn/Unsqueeze_14" Unsqueeze )/blocks.21/self_attn/Constant_37_output_0 /blocks.21/self_attn/Constant_37"Constant*H value*<B,/blocks.21/self_attn/Constant_37_attr::valueJ )/blocks.21/self_attn/Constant_38_output_0 /blocks.21/self_attn/Constant_38"Constant*H value*<B,/blocks.21/self_attn/Constant_38_attr::valueJ  &/blocks.21/self_attn/Gather_8_output_0 )/blocks.21/self_attn/Constant_38_output_0*/blocks.21/self_attn/Unsqueeze_15_output_0!/blocks.21/self_attn/Unsqueeze_15" Unsqueeze )/blocks.21/self_attn/Constant_39_output_0 /blocks.21/self_attn/Constant_39"Constant*H value*<B,/blocks.21/self_attn/Constant_39_attr::valueJ  &/blocks.21/self_attn/Gather_9_output_0 )/blocks.21/self_attn/Constant_39_output_0*/blocks.21/self_attn/Unsqueeze_16_output_0!/blocks.21/self_attn/Unsqueeze_16" Unsqueeze  */blocks.21/self_attn/Unsqueeze_13_output_0 */blocks.21/self_attn/Unsqueeze_14_output_0 )/blocks.21/self_attn/Constant_37_output_0 */blocks.21/self_attn/Unsqueeze_15_output_0 */blocks.21/self_attn/Unsqueeze_16_output_0&/blocks.21/self_attn/Concat_8_output_0/blocks.21/self_attn/Concat_8"Concat* axis )/blocks.21/self_attn/Constant_40_output_0 /blocks.21/self_attn/Constant_40"Constant*H value*<B,/blocks.21/self_attn/Constant_40_attr::valueJ  &/blocks.21/self_attn/Concat_8_output_0 )/blocks.21/self_attn/Constant_40_output_0'/blocks.21/self_attn/Reshape_3_output_0/blocks.21/self_attn/Reshape_3"Reshape* allowzero u '/blocks.21/self_attn/Reshape_3_output_0%/blocks.21/self_attn/Shape_8_output_0/blocks.21/self_attn/Shape_8"Shape  %/blocks.21/self_attn/Shape_8_output_0-/blocks.21/self_attn/ConstantOfShape_output_0$/blocks.21/self_attn/ConstantOfShape"ConstantOfShape*L value*@B0/blocks.21/self_attn/ConstantOfShape_attr::valueJ )/blocks.21/self_attn/Constant_41_output_0 /blocks.21/self_attn/Constant_41"Constant*F value*:B,/blocks.21/self_attn/Constant_41_attr::valueJ  -/blocks.21/self_attn/ConstantOfShape_output_0 )/blocks.21/self_attn/Constant_41_output_0#/blocks.21/self_attn/Mul_4_output_0/blocks.21/self_attn/Mul_4"Mul  '/blocks.21/self_attn/Reshape_3_output_0 #/blocks.21/self_attn/Mul_4_output_0#/blocks.21/self_attn/Equal_output_0/blocks.21/self_attn/Equal"Equal  #/blocks.21/self_attn/Equal_output_0 -/blocks.21/self_attn/ConstantOfShape_output_0 '/blocks.21/self_attn/Reshape_3_output_0#/blocks.21/self_attn/Where_output_0/blocks.21/self_attn/Where"Where  */blocks.21/self_attn/Unsqueeze_12_output_0 #/blocks.21/self_attn/Where_output_0$/blocks.21/self_attn/Expand_output_0/blocks.21/self_attn/Expand"Expand )/blocks.21/self_attn/Constant_42_output_0 /blocks.21/self_attn/Constant_42"Constant*F value*:B,/blocks.21/self_attn/Constant_42_attr::valueJ  &/blocks.21/self_attn/Gather_7_output_0 )/blocks.21/self_attn/Constant_42_output_0#/blocks.21/self_attn/Mul_5_output_0/blocks.21/self_attn/Mul_5"Mul fonnx::Unsqueeze_6642 Constant_8217"Constant*5 value*)BConstant_8217_attr::valueJ  &/blocks.21/self_attn/Gather_6_output_0 onnx::Unsqueeze_6642*/blocks.21/self_attn/Unsqueeze_17_output_0!/blocks.21/self_attn/Unsqueeze_17" Unsqueeze fonnx::Unsqueeze_6644 Constant_8219"Constant*5 value*)BConstant_8219_attr::valueJ  #/blocks.21/self_attn/Mul_5_output_0 onnx::Unsqueeze_6644*/blocks.21/self_attn/Unsqueeze_18_output_0!/blocks.21/self_attn/Unsqueeze_18" Unsqueeze fonnx::Unsqueeze_6646 Constant_8221"Constant*5 value*)BConstant_8221_attr::valueJ  &/blocks.21/self_attn/Gather_8_output_0 onnx::Unsqueeze_6646*/blocks.21/self_attn/Unsqueeze_19_output_0!/blocks.21/self_attn/Unsqueeze_19" Unsqueeze fonnx::Unsqueeze_6648 Constant_8223"Constant*5 value*)BConstant_8223_attr::valueJ  &/blocks.21/self_attn/Gather_9_output_0 onnx::Unsqueeze_6648*/blocks.21/self_attn/Unsqueeze_20_output_0!/blocks.21/self_attn/Unsqueeze_20" Unsqueeze  */blocks.21/self_attn/Unsqueeze_17_output_0 */blocks.21/self_attn/Unsqueeze_18_output_0 */blocks.21/self_attn/Unsqueeze_19_output_0 */blocks.21/self_attn/Unsqueeze_20_output_0&/blocks.21/self_attn/Concat_9_output_0/blocks.21/self_attn/Concat_9"Concat* axis  $/blocks.21/self_attn/Expand_output_0 &/blocks.21/self_attn/Concat_9_output_0'/blocks.21/self_attn/Reshape_4_output_0/blocks.21/self_attn/Reshape_4"Reshape* allowzero w )/blocks.21/self_attn/Transpose_2_output_0%/blocks.21/self_attn/Shape_9_output_0/blocks.21/self_attn/Shape_9"Shape )/blocks.21/self_attn/Constant_43_output_0 /blocks.21/self_attn/Constant_43"Constant*F value*:B,/blocks.21/self_attn/Constant_43_attr::valueJ  %/blocks.21/self_attn/Shape_9_output_0 )/blocks.21/self_attn/Constant_43_output_0'/blocks.21/self_attn/Gather_10_output_0/blocks.21/self_attn/Gather_10"Gather* axis y )/blocks.21/self_attn/Transpose_2_output_0&/blocks.21/self_attn/Shape_10_output_0/blocks.21/self_attn/Shape_10"Shape )/blocks.21/self_attn/Constant_44_output_0 /blocks.21/self_attn/Constant_44"Constant*F value*:B,/blocks.21/self_attn/Constant_44_attr::valueJ  &/blocks.21/self_attn/Shape_10_output_0 )/blocks.21/self_attn/Constant_44_output_0'/blocks.21/self_attn/Gather_11_output_0/blocks.21/self_attn/Gather_11"Gather* axis y )/blocks.21/self_attn/Transpose_2_output_0&/blocks.21/self_attn/Shape_11_output_0/blocks.21/self_attn/Shape_11"Shape )/blocks.21/self_attn/Constant_45_output_0 /blocks.21/self_attn/Constant_45"Constant*F value*:B,/blocks.21/self_attn/Constant_45_attr::valueJ  &/blocks.21/self_attn/Shape_11_output_0 )/blocks.21/self_attn/Constant_45_output_0'/blocks.21/self_attn/Gather_12_output_0/blocks.21/self_attn/Gather_12"Gather* axis y )/blocks.21/self_attn/Transpose_2_output_0&/blocks.21/self_attn/Shape_12_output_0/blocks.21/self_attn/Shape_12"Shape )/blocks.21/self_attn/Constant_46_output_0 /blocks.21/self_attn/Constant_46"Constant*F value*:B,/blocks.21/self_attn/Constant_46_attr::valueJ  &/blocks.21/self_attn/Shape_12_output_0 )/blocks.21/self_attn/Constant_46_output_0'/blocks.21/self_attn/Gather_13_output_0/blocks.21/self_attn/Gather_13"Gather* axis )/blocks.21/self_attn/Constant_47_output_0 /blocks.21/self_attn/Constant_47"Constant*H value*<B,/blocks.21/self_attn/Constant_47_attr::valueJ  )/blocks.21/self_attn/Transpose_2_output_0 )/blocks.21/self_attn/Constant_47_output_0*/blocks.21/self_attn/Unsqueeze_21_output_0!/blocks.21/self_attn/Unsqueeze_21" Unsqueeze )/blocks.21/self_attn/Constant_48_output_0 /blocks.21/self_attn/Constant_48"Constant*H value*<B,/blocks.21/self_attn/Constant_48_attr::valueJ  '/blocks.21/self_attn/Gather_10_output_0 )/blocks.21/self_attn/Constant_48_output_0*/blocks.21/self_attn/Unsqueeze_22_output_0!/blocks.21/self_attn/Unsqueeze_22" Unsqueeze )/blocks.21/self_attn/Constant_49_output_0 /blocks.21/self_attn/Constant_49"Constant*H value*<B,/blocks.21/self_attn/Constant_49_attr::valueJ  '/blocks.21/self_attn/Gather_11_output_0 )/blocks.21/self_attn/Constant_49_output_0*/blocks.21/self_attn/Unsqueeze_23_output_0!/blocks.21/self_attn/Unsqueeze_23" Unsqueeze )/blocks.21/self_attn/Constant_50_output_0 /blocks.21/self_attn/Constant_50"Constant*H value*<B,/blocks.21/self_attn/Constant_50_attr::valueJ )/blocks.21/self_attn/Constant_51_output_0 /blocks.21/self_attn/Constant_51"Constant*H value*<B,/blocks.21/self_attn/Constant_51_attr::valueJ  '/blocks.21/self_attn/Gather_12_output_0 )/blocks.21/self_attn/Constant_51_output_0*/blocks.21/self_attn/Unsqueeze_24_output_0!/blocks.21/self_attn/Unsqueeze_24" Unsqueeze )/blocks.21/self_attn/Constant_52_output_0 /blocks.21/self_attn/Constant_52"Constant*H value*<B,/blocks.21/self_attn/Constant_52_attr::valueJ  '/blocks.21/self_attn/Gather_13_output_0 )/blocks.21/self_attn/Constant_52_output_0*/blocks.21/self_attn/Unsqueeze_25_output_0!/blocks.21/self_attn/Unsqueeze_25" Unsqueeze  */blocks.21/self_attn/Unsqueeze_22_output_0 */blocks.21/self_attn/Unsqueeze_23_output_0 )/blocks.21/self_attn/Constant_50_output_0 */blocks.21/self_attn/Unsqueeze_24_output_0 */blocks.21/self_attn/Unsqueeze_25_output_0'/blocks.21/self_attn/Concat_10_output_0/blocks.21/self_attn/Concat_10"Concat* axis )/blocks.21/self_attn/Constant_53_output_0 /blocks.21/self_attn/Constant_53"Constant*H value*<B,/blocks.21/self_attn/Constant_53_attr::valueJ  '/blocks.21/self_attn/Concat_10_output_0 )/blocks.21/self_attn/Constant_53_output_0'/blocks.21/self_attn/Reshape_5_output_0/blocks.21/self_attn/Reshape_5"Reshape* allowzero w '/blocks.21/self_attn/Reshape_5_output_0&/blocks.21/self_attn/Shape_13_output_0/blocks.21/self_attn/Shape_13"Shape  &/blocks.21/self_attn/Shape_13_output_0//blocks.21/self_attn/ConstantOfShape_1_output_0&/blocks.21/self_attn/ConstantOfShape_1"ConstantOfShape*N value*BB2/blocks.21/self_attn/ConstantOfShape_1_attr::valueJ )/blocks.21/self_attn/Constant_54_output_0 /blocks.21/self_attn/Constant_54"Constant*F value*:B,/blocks.21/self_attn/Constant_54_attr::valueJ  //blocks.21/self_attn/ConstantOfShape_1_output_0 )/blocks.21/self_attn/Constant_54_output_0#/blocks.21/self_attn/Mul_6_output_0/blocks.21/self_attn/Mul_6"Mul  '/blocks.21/self_attn/Reshape_5_output_0 #/blocks.21/self_attn/Mul_6_output_0%/blocks.21/self_attn/Equal_1_output_0/blocks.21/self_attn/Equal_1"Equal  %/blocks.21/self_attn/Equal_1_output_0 //blocks.21/self_attn/ConstantOfShape_1_output_0 '/blocks.21/self_attn/Reshape_5_output_0%/blocks.21/self_attn/Where_1_output_0/blocks.21/self_attn/Where_1"Where  */blocks.21/self_attn/Unsqueeze_21_output_0 %/blocks.21/self_attn/Where_1_output_0&/blocks.21/self_attn/Expand_1_output_0/blocks.21/self_attn/Expand_1"Expand )/blocks.21/self_attn/Constant_55_output_0 /blocks.21/self_attn/Constant_55"Constant*F value*:B,/blocks.21/self_attn/Constant_55_attr::valueJ  '/blocks.21/self_attn/Gather_11_output_0 )/blocks.21/self_attn/Constant_55_output_0#/blocks.21/self_attn/Mul_7_output_0/blocks.21/self_attn/Mul_7"Mul fonnx::Unsqueeze_6688 Constant_8262"Constant*5 value*)BConstant_8262_attr::valueJ  '/blocks.21/self_attn/Gather_10_output_0 onnx::Unsqueeze_6688*/blocks.21/self_attn/Unsqueeze_26_output_0!/blocks.21/self_attn/Unsqueeze_26" Unsqueeze fonnx::Unsqueeze_6690 Constant_8264"Constant*5 value*)BConstant_8264_attr::valueJ  #/blocks.21/self_attn/Mul_7_output_0 onnx::Unsqueeze_6690*/blocks.21/self_attn/Unsqueeze_27_output_0!/blocks.21/self_attn/Unsqueeze_27" Unsqueeze fonnx::Unsqueeze_6692 Constant_8266"Constant*5 value*)BConstant_8266_attr::valueJ  '/blocks.21/self_attn/Gather_12_output_0 onnx::Unsqueeze_6692*/blocks.21/self_attn/Unsqueeze_28_output_0!/blocks.21/self_attn/Unsqueeze_28" Unsqueeze fonnx::Unsqueeze_6694 Constant_8268"Constant*5 value*)BConstant_8268_attr::valueJ  '/blocks.21/self_attn/Gather_13_output_0 onnx::Unsqueeze_6694*/blocks.21/self_attn/Unsqueeze_29_output_0!/blocks.21/self_attn/Unsqueeze_29" Unsqueeze  */blocks.21/self_attn/Unsqueeze_26_output_0 */blocks.21/self_attn/Unsqueeze_27_output_0 */blocks.21/self_attn/Unsqueeze_28_output_0 */blocks.21/self_attn/Unsqueeze_29_output_0'/blocks.21/self_attn/Concat_11_output_0/blocks.21/self_attn/Concat_11"Concat* axis  &/blocks.21/self_attn/Expand_1_output_0 '/blocks.21/self_attn/Concat_11_output_0'/blocks.21/self_attn/Reshape_6_output_0/blocks.21/self_attn/Reshape_6"Reshape* allowzero  '/blocks.21/self_attn/Transpose_output_0 '/blocks.21/self_attn/Reshape_4_output_0$/blocks.21/self_attn/MatMul_output_0/blocks.21/self_attn/MatMul"MatMul )/blocks.21/self_attn/Constant_56_output_0 /blocks.21/self_attn/Constant_56"Constant*B value*6B,/blocks.21/self_attn/Constant_56_attr::valueJ5A  $/blocks.21/self_attn/MatMul_output_0 )/blocks.21/self_attn/Constant_56_output_0#/blocks.21/self_attn/Div_2_output_0/blocks.21/self_attn/Div_2"Div { #/blocks.21/self_attn/Div_2_output_0 attention_mask#/blocks.21/self_attn/Add_2_output_0/blocks.21/self_attn/Add_2"Add  #/blocks.21/self_attn/Add_2_output_0%/blocks.21/self_attn/Softmax_output_0/blocks.21/self_attn/Softmax"Softmax* axis { %/blocks.21/self_attn/Softmax_output_0$/blocks.21/self_attn/Cast_4_output_0/blocks.21/self_attn/Cast_4"Cast* to  $/blocks.21/self_attn/Cast_4_output_0 '/blocks.21/self_attn/Reshape_6_output_0&/blocks.21/self_attn/MatMul_1_output_0/blocks.21/self_attn/MatMul_1"MatMul  &/blocks.21/self_attn/MatMul_1_output_0)/blocks.21/self_attn/Transpose_3_output_0 /blocks.21/self_attn/Transpose_3" Transpose* perm@@@@ fonnx::Unsqueeze_6706 Constant_8280"Constant*5 value*)BConstant_8280_attr::valueJ  $/blocks.21/self_attn/Gather_output_0 onnx::Unsqueeze_6706*/blocks.21/self_attn/Unsqueeze_30_output_0!/blocks.21/self_attn/Unsqueeze_30" Unsqueeze fonnx::Unsqueeze_6708 Constant_8282"Constant*5 value*)BConstant_8282_attr::valueJ  &/blocks.21/self_attn/Gather_1_output_0 onnx::Unsqueeze_6708*/blocks.21/self_attn/Unsqueeze_31_output_0!/blocks.21/self_attn/Unsqueeze_31" Unsqueeze )/blocks.21/self_attn/Constant_57_output_0 /blocks.21/self_attn/Constant_57"Constant*H value*<B,/blocks.21/self_attn/Constant_57_attr::valueJ  */blocks.21/self_attn/Unsqueeze_30_output_0 */blocks.21/self_attn/Unsqueeze_31_output_0 )/blocks.21/self_attn/Constant_57_output_0'/blocks.21/self_attn/Concat_12_output_0/blocks.21/self_attn/Concat_12"Concat* axis  )/blocks.21/self_attn/Transpose_3_output_0 '/blocks.21/self_attn/Concat_12_output_0'/blocks.21/self_attn/Reshape_7_output_0/blocks.21/self_attn/Reshape_7"Reshape* allowzero  '/blocks.21/self_attn/Reshape_7_output_0 onnx::MatMul_9177+/blocks.21/self_attn/o_proj/MatMul_output_0"/blocks.21/self_attn/o_proj/MatMul"MatMul  */blocks.21/input_layernorm/Cast_1_output_0 +/blocks.21/self_attn/o_proj/MatMul_output_0/blocks.21/Add_output_0/blocks.21/Add"Add  /blocks.21/Add_output_01/blocks.21/post_attention_layernorm/Cast_output_0(/blocks.21/post_attention_layernorm/Cast"Cast* to 5/blocks.21/post_attention_layernorm/Constant_output_0,/blocks.21/post_attention_layernorm/Constant"Constant*N value*BB8/blocks.21/post_attention_layernorm/Constant_attr::valueJ@  1/blocks.21/post_attention_layernorm/Cast_output_0 5/blocks.21/post_attention_layernorm/Constant_output_00/blocks.21/post_attention_layernorm/Pow_output_0'/blocks.21/post_attention_layernorm/Pow"Pow  0/blocks.21/post_attention_layernorm/Pow_output_07/blocks.21/post_attention_layernorm/ReduceMean_output_0./blocks.21/post_attention_layernorm/ReduceMean" ReduceMean* axes@* keepdims 7/blocks.21/post_attention_layernorm/Constant_1_output_0./blocks.21/post_attention_layernorm/Constant_1"Constant*P value*DB:/blocks.21/post_attention_layernorm/Constant_1_attr::valueJ75  7/blocks.21/post_attention_layernorm/ReduceMean_output_0 7/blocks.21/post_attention_layernorm/Constant_1_output_00/blocks.21/post_attention_layernorm/Add_output_0'/blocks.21/post_attention_layernorm/Add"Add  0/blocks.21/post_attention_layernorm/Add_output_01/blocks.21/post_attention_layernorm/Sqrt_output_0(/blocks.21/post_attention_layernorm/Sqrt"Sqrt 7/blocks.21/post_attention_layernorm/Constant_2_output_0./blocks.21/post_attention_layernorm/Constant_2"Constant*P value*DB:/blocks.21/post_attention_layernorm/Constant_2_attr::valueJ?  7/blocks.21/post_attention_layernorm/Constant_2_output_0 1/blocks.21/post_attention_layernorm/Sqrt_output_00/blocks.21/post_attention_layernorm/Div_output_0'/blocks.21/post_attention_layernorm/Div"Div  1/blocks.21/post_attention_layernorm/Cast_output_03/blocks.21/post_attention_layernorm/Cast_1_output_0*/blocks.21/post_attention_layernorm/Cast_1"Cast* to  3/blocks.21/post_attention_layernorm/Cast_1_output_0 0/blocks.21/post_attention_layernorm/Div_output_00/blocks.21/post_attention_layernorm/Mul_output_0'/blocks.21/post_attention_layernorm/Mul"Mul  0/blocks.21/post_attention_layernorm/Mul_output_0 )blocks.21.post_attention_layernorm.weight2/blocks.21/post_attention_layernorm/Mul_1_output_0)/blocks.21/post_attention_layernorm/Mul_1"Mul  2/blocks.21/post_attention_layernorm/Mul_1_output_03/blocks.21/post_attention_layernorm/Cast_2_output_0*/blocks.21/post_attention_layernorm/Cast_2"Cast* to  3/blocks.21/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_9178(/blocks.21/mlp/gate_proj/MatMul_output_0/blocks.21/mlp/gate_proj/MatMul"MatMul z (/blocks.21/mlp/gate_proj/MatMul_output_0&/blocks.21/mlp/act_fn/Sigmoid_output_0/blocks.21/mlp/act_fn/Sigmoid"Sigmoid  (/blocks.21/mlp/gate_proj/MatMul_output_0 &/blocks.21/mlp/act_fn/Sigmoid_output_0"/blocks.21/mlp/act_fn/Mul_output_0/blocks.21/mlp/act_fn/Mul"Mul  3/blocks.21/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_9179&/blocks.21/mlp/up_proj/MatMul_output_0/blocks.21/mlp/up_proj/MatMul"MatMul  "/blocks.21/mlp/act_fn/Mul_output_0 &/blocks.21/mlp/up_proj/MatMul_output_0/blocks.21/mlp/Mul_output_0/blocks.21/mlp/Mul"Mul  /blocks.21/mlp/Mul_output_0 onnx::MatMul_9180(/blocks.21/mlp/down_proj/MatMul_output_0/blocks.21/mlp/down_proj/MatMul"MatMul  3/blocks.21/post_attention_layernorm/Cast_1_output_0 (/blocks.21/mlp/down_proj/MatMul_output_0/blocks.21/Add_1_output_0/blocks.21/Add_1"Add c/Constant_14_output_0 /Constant_14"Constant*2 value*&B/Constant_14_attr::valueJ ^ past_key_values /Constant_14_output_0/Gather_22_output_0 /Gather_22"Gather* axis /blocks.22/Constant_output_0/blocks.22/Constant"Constant*K value*?B/blocks.22/Constant_attr::valueJ  /blocks.21/Add_1_output_0 /blocks.22/Constant_output_0/blocks.22/Reshape_output_0/blocks.22/Reshape"Reshape* allowzero y /blocks.22/Reshape_output_0(/blocks.22/input_layernorm/Cast_output_0/blocks.22/input_layernorm/Cast"Cast* to ,/blocks.22/input_layernorm/Constant_output_0#/blocks.22/input_layernorm/Constant"Constant*E value*9B//blocks.22/input_layernorm/Constant_attr::valueJ@  (/blocks.22/input_layernorm/Cast_output_0 ,/blocks.22/input_layernorm/Constant_output_0'/blocks.22/input_layernorm/Pow_output_0/blocks.22/input_layernorm/Pow"Pow  '/blocks.22/input_layernorm/Pow_output_0./blocks.22/input_layernorm/ReduceMean_output_0%/blocks.22/input_layernorm/ReduceMean" ReduceMean* axes@* keepdims ./blocks.22/input_layernorm/Constant_1_output_0%/blocks.22/input_layernorm/Constant_1"Constant*G value*;B1/blocks.22/input_layernorm/Constant_1_attr::valueJ75  ./blocks.22/input_layernorm/ReduceMean_output_0 ./blocks.22/input_layernorm/Constant_1_output_0'/blocks.22/input_layernorm/Add_output_0/blocks.22/input_layernorm/Add"Add z '/blocks.22/input_layernorm/Add_output_0(/blocks.22/input_layernorm/Sqrt_output_0/blocks.22/input_layernorm/Sqrt"Sqrt ./blocks.22/input_layernorm/Constant_2_output_0%/blocks.22/input_layernorm/Constant_2"Constant*G value*;B1/blocks.22/input_layernorm/Constant_2_attr::valueJ?  ./blocks.22/input_layernorm/Constant_2_output_0 (/blocks.22/input_layernorm/Sqrt_output_0'/blocks.22/input_layernorm/Div_output_0/blocks.22/input_layernorm/Div"Div  (/blocks.22/input_layernorm/Cast_output_0*/blocks.22/input_layernorm/Cast_1_output_0!/blocks.22/input_layernorm/Cast_1"Cast* to  */blocks.22/input_layernorm/Cast_1_output_0 '/blocks.22/input_layernorm/Div_output_0'/blocks.22/input_layernorm/Mul_output_0/blocks.22/input_layernorm/Mul"Mul  '/blocks.22/input_layernorm/Mul_output_0 blocks.22.input_layernorm.weight)/blocks.22/input_layernorm/Mul_1_output_0 /blocks.22/input_layernorm/Mul_1"Mul  )/blocks.22/input_layernorm/Mul_1_output_0*/blocks.22/input_layernorm/Cast_2_output_0!/blocks.22/input_layernorm/Cast_2"Cast* to t */blocks.22/input_layernorm/Cast_2_output_0#/blocks.22/self_attn/Shape_output_0/blocks.22/self_attn/Shape"Shape &/blocks.22/self_attn/Constant_output_0/blocks.22/self_attn/Constant"Constant*C value*7B)/blocks.22/self_attn/Constant_attr::valueJ  #/blocks.22/self_attn/Shape_output_0 &/blocks.22/self_attn/Constant_output_0$/blocks.22/self_attn/Gather_output_0/blocks.22/self_attn/Gather"Gather* axis x */blocks.22/input_layernorm/Cast_2_output_0%/blocks.22/self_attn/Shape_1_output_0/blocks.22/self_attn/Shape_1"Shape (/blocks.22/self_attn/Constant_1_output_0/blocks.22/self_attn/Constant_1"Constant*E value*9B+/blocks.22/self_attn/Constant_1_attr::valueJ  %/blocks.22/self_attn/Shape_1_output_0 (/blocks.22/self_attn/Constant_1_output_0&/blocks.22/self_attn/Gather_1_output_0/blocks.22/self_attn/Gather_1"Gather* axis  */blocks.22/input_layernorm/Cast_2_output_0 onnx::MatMul_9181+/blocks.22/self_attn/q_proj/MatMul_output_0"/blocks.22/self_attn/q_proj/MatMul"MatMul  */blocks.22/input_layernorm/Cast_2_output_0 onnx::MatMul_9182+/blocks.22/self_attn/k_proj/MatMul_output_0"/blocks.22/self_attn/k_proj/MatMul"MatMul  */blocks.22/input_layernorm/Cast_2_output_0 onnx::MatMul_9183+/blocks.22/self_attn/v_proj/MatMul_output_0"/blocks.22/self_attn/v_proj/MatMul"MatMul fonnx::Unsqueeze_6769 Constant_8335"Constant*5 value*)BConstant_8335_attr::valueJ  $/blocks.22/self_attn/Gather_output_0 onnx::Unsqueeze_6769'/blocks.22/self_attn/Unsqueeze_output_0/blocks.22/self_attn/Unsqueeze" Unsqueeze fonnx::Unsqueeze_6771 Constant_8337"Constant*5 value*)BConstant_8337_attr::valueJ  &/blocks.22/self_attn/Gather_1_output_0 onnx::Unsqueeze_6771)/blocks.22/self_attn/Unsqueeze_1_output_0 /blocks.22/self_attn/Unsqueeze_1" Unsqueeze (/blocks.22/self_attn/Constant_2_output_0/blocks.22/self_attn/Constant_2"Constant*G value*;B+/blocks.22/self_attn/Constant_2_attr::valueJ (/blocks.22/self_attn/Constant_3_output_0/blocks.22/self_attn/Constant_3"Constant*G value*;B+/blocks.22/self_attn/Constant_3_attr::valueJ  '/blocks.22/self_attn/Unsqueeze_output_0 )/blocks.22/self_attn/Unsqueeze_1_output_0 (/blocks.22/self_attn/Constant_2_output_0 (/blocks.22/self_attn/Constant_3_output_0$/blocks.22/self_attn/Concat_output_0/blocks.22/self_attn/Concat"Concat* axis  +/blocks.22/self_attn/q_proj/MatMul_output_0 $/blocks.22/self_attn/Concat_output_0%/blocks.22/self_attn/Reshape_output_0/blocks.22/self_attn/Reshape"Reshape* allowzero fonnx::Unsqueeze_6779 Constant_8343"Constant*5 value*)BConstant_8343_attr::valueJ  $/blocks.22/self_attn/Gather_output_0 onnx::Unsqueeze_6779)/blocks.22/self_attn/Unsqueeze_2_output_0 /blocks.22/self_attn/Unsqueeze_2" Unsqueeze fonnx::Unsqueeze_6781 Constant_8345"Constant*5 value*)BConstant_8345_attr::valueJ  &/blocks.22/self_attn/Gather_1_output_0 onnx::Unsqueeze_6781)/blocks.22/self_attn/Unsqueeze_3_output_0 /blocks.22/self_attn/Unsqueeze_3" Unsqueeze (/blocks.22/self_attn/Constant_4_output_0/blocks.22/self_attn/Constant_4"Constant*G value*;B+/blocks.22/self_attn/Constant_4_attr::valueJ (/blocks.22/self_attn/Constant_5_output_0/blocks.22/self_attn/Constant_5"Constant*G value*;B+/blocks.22/self_attn/Constant_5_attr::valueJ  )/blocks.22/self_attn/Unsqueeze_2_output_0 )/blocks.22/self_attn/Unsqueeze_3_output_0 (/blocks.22/self_attn/Constant_4_output_0 (/blocks.22/self_attn/Constant_5_output_0&/blocks.22/self_attn/Concat_1_output_0/blocks.22/self_attn/Concat_1"Concat* axis fonnx::Unsqueeze_6788 Constant_8350"Constant*5 value*)BConstant_8350_attr::valueJ  $/blocks.22/self_attn/Gather_output_0 onnx::Unsqueeze_6788)/blocks.22/self_attn/Unsqueeze_4_output_0 /blocks.22/self_attn/Unsqueeze_4" Unsqueeze fonnx::Unsqueeze_6790 Constant_8352"Constant*5 value*)BConstant_8352_attr::valueJ  &/blocks.22/self_attn/Gather_1_output_0 onnx::Unsqueeze_6790)/blocks.22/self_attn/Unsqueeze_5_output_0 /blocks.22/self_attn/Unsqueeze_5" Unsqueeze (/blocks.22/self_attn/Constant_6_output_0/blocks.22/self_attn/Constant_6"Constant*G value*;B+/blocks.22/self_attn/Constant_6_attr::valueJ (/blocks.22/self_attn/Constant_7_output_0/blocks.22/self_attn/Constant_7"Constant*G value*;B+/blocks.22/self_attn/Constant_7_attr::valueJ  )/blocks.22/self_attn/Unsqueeze_4_output_0 )/blocks.22/self_attn/Unsqueeze_5_output_0 (/blocks.22/self_attn/Constant_6_output_0 (/blocks.22/self_attn/Constant_7_output_0&/blocks.22/self_attn/Concat_2_output_0/blocks.22/self_attn/Concat_2"Concat* axis  +/blocks.22/self_attn/k_proj/MatMul_output_0 &/blocks.22/self_attn/Concat_1_output_0'/blocks.22/self_attn/Reshape_1_output_0/blocks.22/self_attn/Reshape_1"Reshape* allowzero  +/blocks.22/self_attn/v_proj/MatMul_output_0 &/blocks.22/self_attn/Concat_2_output_0'/blocks.22/self_attn/Reshape_2_output_0/blocks.22/self_attn/Reshape_2"Reshape* allowzero  %/blocks.22/self_attn/Reshape_output_0)/blocks.22/self_attn/q_norm/Cast_output_0 /blocks.22/self_attn/q_norm/Cast"Cast* to -/blocks.22/self_attn/q_norm/Constant_output_0$/blocks.22/self_attn/q_norm/Constant"Constant*F value*:B0/blocks.22/self_attn/q_norm/Constant_attr::valueJ@  )/blocks.22/self_attn/q_norm/Cast_output_0 -/blocks.22/self_attn/q_norm/Constant_output_0(/blocks.22/self_attn/q_norm/Pow_output_0/blocks.22/self_attn/q_norm/Pow"Pow  (/blocks.22/self_attn/q_norm/Pow_output_0//blocks.22/self_attn/q_norm/ReduceMean_output_0&/blocks.22/self_attn/q_norm/ReduceMean" ReduceMean* axes@* keepdims //blocks.22/self_attn/q_norm/Constant_1_output_0&/blocks.22/self_attn/q_norm/Constant_1"Constant*H value*<B2/blocks.22/self_attn/q_norm/Constant_1_attr::valueJ75  //blocks.22/self_attn/q_norm/ReduceMean_output_0 //blocks.22/self_attn/q_norm/Constant_1_output_0(/blocks.22/self_attn/q_norm/Add_output_0/blocks.22/self_attn/q_norm/Add"Add } (/blocks.22/self_attn/q_norm/Add_output_0)/blocks.22/self_attn/q_norm/Sqrt_output_0 /blocks.22/self_attn/q_norm/Sqrt"Sqrt //blocks.22/self_attn/q_norm/Constant_2_output_0&/blocks.22/self_attn/q_norm/Constant_2"Constant*H value*<B2/blocks.22/self_attn/q_norm/Constant_2_attr::valueJ?  //blocks.22/self_attn/q_norm/Constant_2_output_0 )/blocks.22/self_attn/q_norm/Sqrt_output_0(/blocks.22/self_attn/q_norm/Div_output_0/blocks.22/self_attn/q_norm/Div"Div  )/blocks.22/self_attn/q_norm/Cast_output_0+/blocks.22/self_attn/q_norm/Cast_1_output_0"/blocks.22/self_attn/q_norm/Cast_1"Cast* to  +/blocks.22/self_attn/q_norm/Cast_1_output_0 (/blocks.22/self_attn/q_norm/Div_output_0(/blocks.22/self_attn/q_norm/Mul_output_0/blocks.22/self_attn/q_norm/Mul"Mul  (/blocks.22/self_attn/q_norm/Mul_output_0 !blocks.22.self_attn.q_norm.weight*/blocks.22/self_attn/q_norm/Mul_1_output_0!/blocks.22/self_attn/q_norm/Mul_1"Mul  */blocks.22/self_attn/q_norm/Mul_1_output_0+/blocks.22/self_attn/q_norm/Cast_2_output_0"/blocks.22/self_attn/q_norm/Cast_2"Cast* to  '/blocks.22/self_attn/Reshape_1_output_0)/blocks.22/self_attn/k_norm/Cast_output_0 /blocks.22/self_attn/k_norm/Cast"Cast* to -/blocks.22/self_attn/k_norm/Constant_output_0$/blocks.22/self_attn/k_norm/Constant"Constant*F value*:B0/blocks.22/self_attn/k_norm/Constant_attr::valueJ@  )/blocks.22/self_attn/k_norm/Cast_output_0 -/blocks.22/self_attn/k_norm/Constant_output_0(/blocks.22/self_attn/k_norm/Pow_output_0/blocks.22/self_attn/k_norm/Pow"Pow  (/blocks.22/self_attn/k_norm/Pow_output_0//blocks.22/self_attn/k_norm/ReduceMean_output_0&/blocks.22/self_attn/k_norm/ReduceMean" ReduceMean* axes@* keepdims //blocks.22/self_attn/k_norm/Constant_1_output_0&/blocks.22/self_attn/k_norm/Constant_1"Constant*H value*<B2/blocks.22/self_attn/k_norm/Constant_1_attr::valueJ75  //blocks.22/self_attn/k_norm/ReduceMean_output_0 //blocks.22/self_attn/k_norm/Constant_1_output_0(/blocks.22/self_attn/k_norm/Add_output_0/blocks.22/self_attn/k_norm/Add"Add } (/blocks.22/self_attn/k_norm/Add_output_0)/blocks.22/self_attn/k_norm/Sqrt_output_0 /blocks.22/self_attn/k_norm/Sqrt"Sqrt //blocks.22/self_attn/k_norm/Constant_2_output_0&/blocks.22/self_attn/k_norm/Constant_2"Constant*H value*<B2/blocks.22/self_attn/k_norm/Constant_2_attr::valueJ?  //blocks.22/self_attn/k_norm/Constant_2_output_0 )/blocks.22/self_attn/k_norm/Sqrt_output_0(/blocks.22/self_attn/k_norm/Div_output_0/blocks.22/self_attn/k_norm/Div"Div  )/blocks.22/self_attn/k_norm/Cast_output_0+/blocks.22/self_attn/k_norm/Cast_1_output_0"/blocks.22/self_attn/k_norm/Cast_1"Cast* to  +/blocks.22/self_attn/k_norm/Cast_1_output_0 (/blocks.22/self_attn/k_norm/Div_output_0(/blocks.22/self_attn/k_norm/Mul_output_0/blocks.22/self_attn/k_norm/Mul"Mul  (/blocks.22/self_attn/k_norm/Mul_output_0 !blocks.22.self_attn.k_norm.weight*/blocks.22/self_attn/k_norm/Mul_1_output_0!/blocks.22/self_attn/k_norm/Mul_1"Mul  */blocks.22/self_attn/k_norm/Mul_1_output_0+/blocks.22/self_attn/k_norm/Cast_2_output_0"/blocks.22/self_attn/k_norm/Cast_2"Cast* to  +/blocks.22/self_attn/q_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0!/blocks.22/self_attn/Mul_output_0/blocks.22/self_attn/Mul"Mul y +/blocks.22/self_attn/q_norm/Cast_2_output_0%/blocks.22/self_attn/Shape_2_output_0/blocks.22/self_attn/Shape_2"Shape (/blocks.22/self_attn/Constant_8_output_0/blocks.22/self_attn/Constant_8"Constant*E value*9B+/blocks.22/self_attn/Constant_8_attr::valueJ  %/blocks.22/self_attn/Shape_2_output_0 (/blocks.22/self_attn/Constant_8_output_0&/blocks.22/self_attn/Gather_2_output_0/blocks.22/self_attn/Gather_2"Gather* axis (/blocks.22/self_attn/Constant_9_output_0/blocks.22/self_attn/Constant_9"Constant*E value*9B+/blocks.22/self_attn/Constant_9_attr::valueJ  &/blocks.22/self_attn/Gather_2_output_0 (/blocks.22/self_attn/Constant_9_output_0!/blocks.22/self_attn/Div_output_0/blocks.22/self_attn/Div"Div s !/blocks.22/self_attn/Div_output_0"/blocks.22/self_attn/Cast_output_0/blocks.22/self_attn/Cast"Cast* to x "/blocks.22/self_attn/Cast_output_0$/blocks.22/self_attn/Cast_1_output_0/blocks.22/self_attn/Cast_1"Cast* to )/blocks.22/self_attn/Constant_10_output_0 /blocks.22/self_attn/Constant_10"Constant*H value*<B,/blocks.22/self_attn/Constant_10_attr::valueJ )/blocks.22/self_attn/Constant_11_output_0 /blocks.22/self_attn/Constant_11"Constant*H value*<B,/blocks.22/self_attn/Constant_11_attr::valueJ )/blocks.22/self_attn/Constant_12_output_0 /blocks.22/self_attn/Constant_12"Constant*H value*<B,/blocks.22/self_attn/Constant_12_attr::valueJ  $/blocks.22/self_attn/Cast_1_output_0 )/blocks.22/self_attn/Constant_12_output_0)/blocks.22/self_attn/Unsqueeze_6_output_0 /blocks.22/self_attn/Unsqueeze_6" Unsqueeze )/blocks.22/self_attn/Constant_13_output_0 /blocks.22/self_attn/Constant_13"Constant*H value*<B,/blocks.22/self_attn/Constant_13_attr::valueJ  +/blocks.22/self_attn/q_norm/Cast_2_output_0 )/blocks.22/self_attn/Constant_11_output_0 )/blocks.22/self_attn/Unsqueeze_6_output_0 )/blocks.22/self_attn/Constant_10_output_0 )/blocks.22/self_attn/Constant_13_output_0#/blocks.22/self_attn/Slice_output_0/blocks.22/self_attn/Slice"Slice )/blocks.22/self_attn/Constant_14_output_0 /blocks.22/self_attn/Constant_14"Constant*H value*<B,/blocks.22/self_attn/Constant_14_attr::valueJ )/blocks.22/self_attn/Constant_15_output_0 /blocks.22/self_attn/Constant_15"Constant*H value*<B,/blocks.22/self_attn/Constant_15_attr::valueJ  $/blocks.22/self_attn/Cast_1_output_0 )/blocks.22/self_attn/Constant_15_output_0)/blocks.22/self_attn/Unsqueeze_7_output_0 /blocks.22/self_attn/Unsqueeze_7" Unsqueeze )/blocks.22/self_attn/Constant_16_output_0 /blocks.22/self_attn/Constant_16"Constant*H value*<B,/blocks.22/self_attn/Constant_16_attr::valueJ )/blocks.22/self_attn/Constant_17_output_0 /blocks.22/self_attn/Constant_17"Constant*H value*<B,/blocks.22/self_attn/Constant_17_attr::valueJ  +/blocks.22/self_attn/q_norm/Cast_2_output_0 )/blocks.22/self_attn/Unsqueeze_7_output_0 )/blocks.22/self_attn/Constant_16_output_0 )/blocks.22/self_attn/Constant_14_output_0 )/blocks.22/self_attn/Constant_17_output_0%/blocks.22/self_attn/Slice_1_output_0/blocks.22/self_attn/Slice_1"Slice i %/blocks.22/self_attn/Slice_1_output_0!/blocks.22/self_attn/Neg_output_0/blocks.22/self_attn/Neg"Neg  !/blocks.22/self_attn/Neg_output_0 #/blocks.22/self_attn/Slice_output_0&/blocks.22/self_attn/Concat_3_output_0/blocks.22/self_attn/Concat_3"Concat* axis  &/blocks.22/self_attn/Concat_3_output_0 %/blocks.0/self_attn/Gather_3_output_0#/blocks.22/self_attn/Mul_1_output_0/blocks.22/self_attn/Mul_1"Mul  !/blocks.22/self_attn/Mul_output_0 #/blocks.22/self_attn/Mul_1_output_0!/blocks.22/self_attn/Add_output_0/blocks.22/self_attn/Add"Add  +/blocks.22/self_attn/k_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0#/blocks.22/self_attn/Mul_2_output_0/blocks.22/self_attn/Mul_2"Mul y +/blocks.22/self_attn/k_norm/Cast_2_output_0%/blocks.22/self_attn/Shape_3_output_0/blocks.22/self_attn/Shape_3"Shape )/blocks.22/self_attn/Constant_18_output_0 /blocks.22/self_attn/Constant_18"Constant*F value*:B,/blocks.22/self_attn/Constant_18_attr::valueJ  %/blocks.22/self_attn/Shape_3_output_0 )/blocks.22/self_attn/Constant_18_output_0&/blocks.22/self_attn/Gather_3_output_0/blocks.22/self_attn/Gather_3"Gather* axis )/blocks.22/self_attn/Constant_19_output_0 /blocks.22/self_attn/Constant_19"Constant*F value*:B,/blocks.22/self_attn/Constant_19_attr::valueJ  &/blocks.22/self_attn/Gather_3_output_0 )/blocks.22/self_attn/Constant_19_output_0#/blocks.22/self_attn/Div_1_output_0/blocks.22/self_attn/Div_1"Div y #/blocks.22/self_attn/Div_1_output_0$/blocks.22/self_attn/Cast_2_output_0/blocks.22/self_attn/Cast_2"Cast* to z $/blocks.22/self_attn/Cast_2_output_0$/blocks.22/self_attn/Cast_3_output_0/blocks.22/self_attn/Cast_3"Cast* to )/blocks.22/self_attn/Constant_20_output_0 /blocks.22/self_attn/Constant_20"Constant*H value*<B,/blocks.22/self_attn/Constant_20_attr::valueJ )/blocks.22/self_attn/Constant_21_output_0 /blocks.22/self_attn/Constant_21"Constant*H value*<B,/blocks.22/self_attn/Constant_21_attr::valueJ )/blocks.22/self_attn/Constant_22_output_0 /blocks.22/self_attn/Constant_22"Constant*H value*<B,/blocks.22/self_attn/Constant_22_attr::valueJ  $/blocks.22/self_attn/Cast_3_output_0 )/blocks.22/self_attn/Constant_22_output_0)/blocks.22/self_attn/Unsqueeze_8_output_0 /blocks.22/self_attn/Unsqueeze_8" Unsqueeze )/blocks.22/self_attn/Constant_23_output_0 /blocks.22/self_attn/Constant_23"Constant*H value*<B,/blocks.22/self_attn/Constant_23_attr::valueJ  +/blocks.22/self_attn/k_norm/Cast_2_output_0 )/blocks.22/self_attn/Constant_21_output_0 )/blocks.22/self_attn/Unsqueeze_8_output_0 )/blocks.22/self_attn/Constant_20_output_0 )/blocks.22/self_attn/Constant_23_output_0%/blocks.22/self_attn/Slice_2_output_0/blocks.22/self_attn/Slice_2"Slice )/blocks.22/self_attn/Constant_24_output_0 /blocks.22/self_attn/Constant_24"Constant*H value*<B,/blocks.22/self_attn/Constant_24_attr::valueJ )/blocks.22/self_attn/Constant_25_output_0 /blocks.22/self_attn/Constant_25"Constant*H value*<B,/blocks.22/self_attn/Constant_25_attr::valueJ  $/blocks.22/self_attn/Cast_3_output_0 )/blocks.22/self_attn/Constant_25_output_0)/blocks.22/self_attn/Unsqueeze_9_output_0 /blocks.22/self_attn/Unsqueeze_9" Unsqueeze )/blocks.22/self_attn/Constant_26_output_0 /blocks.22/self_attn/Constant_26"Constant*H value*<B,/blocks.22/self_attn/Constant_26_attr::valueJ )/blocks.22/self_attn/Constant_27_output_0 /blocks.22/self_attn/Constant_27"Constant*H value*<B,/blocks.22/self_attn/Constant_27_attr::valueJ  +/blocks.22/self_attn/k_norm/Cast_2_output_0 )/blocks.22/self_attn/Unsqueeze_9_output_0 )/blocks.22/self_attn/Constant_26_output_0 )/blocks.22/self_attn/Constant_24_output_0 )/blocks.22/self_attn/Constant_27_output_0%/blocks.22/self_attn/Slice_3_output_0/blocks.22/self_attn/Slice_3"Slice m %/blocks.22/self_attn/Slice_3_output_0#/blocks.22/self_attn/Neg_1_output_0/blocks.22/self_attn/Neg_1"Neg  #/blocks.22/self_attn/Neg_1_output_0 %/blocks.22/self_attn/Slice_2_output_0&/blocks.22/self_attn/Concat_4_output_0/blocks.22/self_attn/Concat_4"Concat* axis  &/blocks.22/self_attn/Concat_4_output_0 %/blocks.0/self_attn/Gather_3_output_0#/blocks.22/self_attn/Mul_3_output_0/blocks.22/self_attn/Mul_3"Mul  #/blocks.22/self_attn/Mul_2_output_0 #/blocks.22/self_attn/Mul_3_output_0#/blocks.22/self_attn/Add_1_output_0/blocks.22/self_attn/Add_1"Add  /Gather_22_output_0 /rotary/Constant_3_output_0&/blocks.22/self_attn/Gather_4_output_0/blocks.22/self_attn/Gather_4"Gather* axis  /Gather_22_output_0 /rotary/Constant_8_output_0&/blocks.22/self_attn/Gather_5_output_0/blocks.22/self_attn/Gather_5"Gather* axis  &/blocks.22/self_attn/Gather_4_output_0 #/blocks.22/self_attn/Add_1_output_0&/blocks.22/self_attn/Concat_5_output_0/blocks.22/self_attn/Concat_5"Concat* axis  &/blocks.22/self_attn/Gather_5_output_0 '/blocks.22/self_attn/Reshape_2_output_0&/blocks.22/self_attn/Concat_6_output_0/blocks.22/self_attn/Concat_6"Concat* axis )/blocks.22/self_attn/Constant_28_output_0 /blocks.22/self_attn/Constant_28"Constant*H value*<B,/blocks.22/self_attn/Constant_28_attr::valueJ  &/blocks.22/self_attn/Concat_5_output_0 )/blocks.22/self_attn/Constant_28_output_0*/blocks.22/self_attn/Unsqueeze_10_output_0!/blocks.22/self_attn/Unsqueeze_10" Unsqueeze )/blocks.22/self_attn/Constant_29_output_0 /blocks.22/self_attn/Constant_29"Constant*H value*<B,/blocks.22/self_attn/Constant_29_attr::valueJ  &/blocks.22/self_attn/Concat_6_output_0 )/blocks.22/self_attn/Constant_29_output_0*/blocks.22/self_attn/Unsqueeze_11_output_0!/blocks.22/self_attn/Unsqueeze_11" Unsqueeze  */blocks.22/self_attn/Unsqueeze_10_output_0 */blocks.22/self_attn/Unsqueeze_11_output_0&/blocks.22/self_attn/Concat_7_output_0/blocks.22/self_attn/Concat_7"Concat* axis  !/blocks.22/self_attn/Add_output_0'/blocks.22/self_attn/Transpose_output_0/blocks.22/self_attn/Transpose" Transpose* perm@@@@  &/blocks.22/self_attn/Concat_5_output_0)/blocks.22/self_attn/Transpose_1_output_0 /blocks.22/self_attn/Transpose_1" Transpose* perm@@@@  &/blocks.22/self_attn/Concat_6_output_0)/blocks.22/self_attn/Transpose_2_output_0 /blocks.22/self_attn/Transpose_2" Transpose* perm@@@@ w )/blocks.22/self_attn/Transpose_1_output_0%/blocks.22/self_attn/Shape_4_output_0/blocks.22/self_attn/Shape_4"Shape )/blocks.22/self_attn/Constant_30_output_0 /blocks.22/self_attn/Constant_30"Constant*F value*:B,/blocks.22/self_attn/Constant_30_attr::valueJ  %/blocks.22/self_attn/Shape_4_output_0 )/blocks.22/self_attn/Constant_30_output_0&/blocks.22/self_attn/Gather_6_output_0/blocks.22/self_attn/Gather_6"Gather* axis w )/blocks.22/self_attn/Transpose_1_output_0%/blocks.22/self_attn/Shape_5_output_0/blocks.22/self_attn/Shape_5"Shape )/blocks.22/self_attn/Constant_31_output_0 /blocks.22/self_attn/Constant_31"Constant*F value*:B,/blocks.22/self_attn/Constant_31_attr::valueJ  %/blocks.22/self_attn/Shape_5_output_0 )/blocks.22/self_attn/Constant_31_output_0&/blocks.22/self_attn/Gather_7_output_0/blocks.22/self_attn/Gather_7"Gather* axis w )/blocks.22/self_attn/Transpose_1_output_0%/blocks.22/self_attn/Shape_6_output_0/blocks.22/self_attn/Shape_6"Shape )/blocks.22/self_attn/Constant_32_output_0 /blocks.22/self_attn/Constant_32"Constant*F value*:B,/blocks.22/self_attn/Constant_32_attr::valueJ  %/blocks.22/self_attn/Shape_6_output_0 )/blocks.22/self_attn/Constant_32_output_0&/blocks.22/self_attn/Gather_8_output_0/blocks.22/self_attn/Gather_8"Gather* axis w )/blocks.22/self_attn/Transpose_1_output_0%/blocks.22/self_attn/Shape_7_output_0/blocks.22/self_attn/Shape_7"Shape )/blocks.22/self_attn/Constant_33_output_0 /blocks.22/self_attn/Constant_33"Constant*F value*:B,/blocks.22/self_attn/Constant_33_attr::valueJ  %/blocks.22/self_attn/Shape_7_output_0 )/blocks.22/self_attn/Constant_33_output_0&/blocks.22/self_attn/Gather_9_output_0/blocks.22/self_attn/Gather_9"Gather* axis )/blocks.22/self_attn/Constant_34_output_0 /blocks.22/self_attn/Constant_34"Constant*H value*<B,/blocks.22/self_attn/Constant_34_attr::valueJ  )/blocks.22/self_attn/Transpose_1_output_0 )/blocks.22/self_attn/Constant_34_output_0*/blocks.22/self_attn/Unsqueeze_12_output_0!/blocks.22/self_attn/Unsqueeze_12" Unsqueeze )/blocks.22/self_attn/Constant_35_output_0 /blocks.22/self_attn/Constant_35"Constant*H value*<B,/blocks.22/self_attn/Constant_35_attr::valueJ  &/blocks.22/self_attn/Gather_6_output_0 )/blocks.22/self_attn/Constant_35_output_0*/blocks.22/self_attn/Unsqueeze_13_output_0!/blocks.22/self_attn/Unsqueeze_13" Unsqueeze )/blocks.22/self_attn/Constant_36_output_0 /blocks.22/self_attn/Constant_36"Constant*H value*<B,/blocks.22/self_attn/Constant_36_attr::valueJ  &/blocks.22/self_attn/Gather_7_output_0 )/blocks.22/self_attn/Constant_36_output_0*/blocks.22/self_attn/Unsqueeze_14_output_0!/blocks.22/self_attn/Unsqueeze_14" Unsqueeze )/blocks.22/self_attn/Constant_37_output_0 /blocks.22/self_attn/Constant_37"Constant*H value*<B,/blocks.22/self_attn/Constant_37_attr::valueJ )/blocks.22/self_attn/Constant_38_output_0 /blocks.22/self_attn/Constant_38"Constant*H value*<B,/blocks.22/self_attn/Constant_38_attr::valueJ  &/blocks.22/self_attn/Gather_8_output_0 )/blocks.22/self_attn/Constant_38_output_0*/blocks.22/self_attn/Unsqueeze_15_output_0!/blocks.22/self_attn/Unsqueeze_15" Unsqueeze )/blocks.22/self_attn/Constant_39_output_0 /blocks.22/self_attn/Constant_39"Constant*H value*<B,/blocks.22/self_attn/Constant_39_attr::valueJ  &/blocks.22/self_attn/Gather_9_output_0 )/blocks.22/self_attn/Constant_39_output_0*/blocks.22/self_attn/Unsqueeze_16_output_0!/blocks.22/self_attn/Unsqueeze_16" Unsqueeze  */blocks.22/self_attn/Unsqueeze_13_output_0 */blocks.22/self_attn/Unsqueeze_14_output_0 )/blocks.22/self_attn/Constant_37_output_0 */blocks.22/self_attn/Unsqueeze_15_output_0 */blocks.22/self_attn/Unsqueeze_16_output_0&/blocks.22/self_attn/Concat_8_output_0/blocks.22/self_attn/Concat_8"Concat* axis )/blocks.22/self_attn/Constant_40_output_0 /blocks.22/self_attn/Constant_40"Constant*H value*<B,/blocks.22/self_attn/Constant_40_attr::valueJ  &/blocks.22/self_attn/Concat_8_output_0 )/blocks.22/self_attn/Constant_40_output_0'/blocks.22/self_attn/Reshape_3_output_0/blocks.22/self_attn/Reshape_3"Reshape* allowzero u '/blocks.22/self_attn/Reshape_3_output_0%/blocks.22/self_attn/Shape_8_output_0/blocks.22/self_attn/Shape_8"Shape  %/blocks.22/self_attn/Shape_8_output_0-/blocks.22/self_attn/ConstantOfShape_output_0$/blocks.22/self_attn/ConstantOfShape"ConstantOfShape*L value*@B0/blocks.22/self_attn/ConstantOfShape_attr::valueJ )/blocks.22/self_attn/Constant_41_output_0 /blocks.22/self_attn/Constant_41"Constant*F value*:B,/blocks.22/self_attn/Constant_41_attr::valueJ  -/blocks.22/self_attn/ConstantOfShape_output_0 )/blocks.22/self_attn/Constant_41_output_0#/blocks.22/self_attn/Mul_4_output_0/blocks.22/self_attn/Mul_4"Mul  '/blocks.22/self_attn/Reshape_3_output_0 #/blocks.22/self_attn/Mul_4_output_0#/blocks.22/self_attn/Equal_output_0/blocks.22/self_attn/Equal"Equal  #/blocks.22/self_attn/Equal_output_0 -/blocks.22/self_attn/ConstantOfShape_output_0 '/blocks.22/self_attn/Reshape_3_output_0#/blocks.22/self_attn/Where_output_0/blocks.22/self_attn/Where"Where  */blocks.22/self_attn/Unsqueeze_12_output_0 #/blocks.22/self_attn/Where_output_0$/blocks.22/self_attn/Expand_output_0/blocks.22/self_attn/Expand"Expand )/blocks.22/self_attn/Constant_42_output_0 /blocks.22/self_attn/Constant_42"Constant*F value*:B,/blocks.22/self_attn/Constant_42_attr::valueJ  &/blocks.22/self_attn/Gather_7_output_0 )/blocks.22/self_attn/Constant_42_output_0#/blocks.22/self_attn/Mul_5_output_0/blocks.22/self_attn/Mul_5"Mul fonnx::Unsqueeze_6933 Constant_8480"Constant*5 value*)BConstant_8480_attr::valueJ  &/blocks.22/self_attn/Gather_6_output_0 onnx::Unsqueeze_6933*/blocks.22/self_attn/Unsqueeze_17_output_0!/blocks.22/self_attn/Unsqueeze_17" Unsqueeze fonnx::Unsqueeze_6935 Constant_8482"Constant*5 value*)BConstant_8482_attr::valueJ  #/blocks.22/self_attn/Mul_5_output_0 onnx::Unsqueeze_6935*/blocks.22/self_attn/Unsqueeze_18_output_0!/blocks.22/self_attn/Unsqueeze_18" Unsqueeze fonnx::Unsqueeze_6937 Constant_8484"Constant*5 value*)BConstant_8484_attr::valueJ  &/blocks.22/self_attn/Gather_8_output_0 onnx::Unsqueeze_6937*/blocks.22/self_attn/Unsqueeze_19_output_0!/blocks.22/self_attn/Unsqueeze_19" Unsqueeze fonnx::Unsqueeze_6939 Constant_8486"Constant*5 value*)BConstant_8486_attr::valueJ  &/blocks.22/self_attn/Gather_9_output_0 onnx::Unsqueeze_6939*/blocks.22/self_attn/Unsqueeze_20_output_0!/blocks.22/self_attn/Unsqueeze_20" Unsqueeze  */blocks.22/self_attn/Unsqueeze_17_output_0 */blocks.22/self_attn/Unsqueeze_18_output_0 */blocks.22/self_attn/Unsqueeze_19_output_0 */blocks.22/self_attn/Unsqueeze_20_output_0&/blocks.22/self_attn/Concat_9_output_0/blocks.22/self_attn/Concat_9"Concat* axis  $/blocks.22/self_attn/Expand_output_0 &/blocks.22/self_attn/Concat_9_output_0'/blocks.22/self_attn/Reshape_4_output_0/blocks.22/self_attn/Reshape_4"Reshape* allowzero w )/blocks.22/self_attn/Transpose_2_output_0%/blocks.22/self_attn/Shape_9_output_0/blocks.22/self_attn/Shape_9"Shape )/blocks.22/self_attn/Constant_43_output_0 /blocks.22/self_attn/Constant_43"Constant*F value*:B,/blocks.22/self_attn/Constant_43_attr::valueJ  %/blocks.22/self_attn/Shape_9_output_0 )/blocks.22/self_attn/Constant_43_output_0'/blocks.22/self_attn/Gather_10_output_0/blocks.22/self_attn/Gather_10"Gather* axis y )/blocks.22/self_attn/Transpose_2_output_0&/blocks.22/self_attn/Shape_10_output_0/blocks.22/self_attn/Shape_10"Shape )/blocks.22/self_attn/Constant_44_output_0 /blocks.22/self_attn/Constant_44"Constant*F value*:B,/blocks.22/self_attn/Constant_44_attr::valueJ  &/blocks.22/self_attn/Shape_10_output_0 )/blocks.22/self_attn/Constant_44_output_0'/blocks.22/self_attn/Gather_11_output_0/blocks.22/self_attn/Gather_11"Gather* axis y )/blocks.22/self_attn/Transpose_2_output_0&/blocks.22/self_attn/Shape_11_output_0/blocks.22/self_attn/Shape_11"Shape )/blocks.22/self_attn/Constant_45_output_0 /blocks.22/self_attn/Constant_45"Constant*F value*:B,/blocks.22/self_attn/Constant_45_attr::valueJ  &/blocks.22/self_attn/Shape_11_output_0 )/blocks.22/self_attn/Constant_45_output_0'/blocks.22/self_attn/Gather_12_output_0/blocks.22/self_attn/Gather_12"Gather* axis y )/blocks.22/self_attn/Transpose_2_output_0&/blocks.22/self_attn/Shape_12_output_0/blocks.22/self_attn/Shape_12"Shape )/blocks.22/self_attn/Constant_46_output_0 /blocks.22/self_attn/Constant_46"Constant*F value*:B,/blocks.22/self_attn/Constant_46_attr::valueJ  &/blocks.22/self_attn/Shape_12_output_0 )/blocks.22/self_attn/Constant_46_output_0'/blocks.22/self_attn/Gather_13_output_0/blocks.22/self_attn/Gather_13"Gather* axis )/blocks.22/self_attn/Constant_47_output_0 /blocks.22/self_attn/Constant_47"Constant*H value*<B,/blocks.22/self_attn/Constant_47_attr::valueJ  )/blocks.22/self_attn/Transpose_2_output_0 )/blocks.22/self_attn/Constant_47_output_0*/blocks.22/self_attn/Unsqueeze_21_output_0!/blocks.22/self_attn/Unsqueeze_21" Unsqueeze )/blocks.22/self_attn/Constant_48_output_0 /blocks.22/self_attn/Constant_48"Constant*H value*<B,/blocks.22/self_attn/Constant_48_attr::valueJ  '/blocks.22/self_attn/Gather_10_output_0 )/blocks.22/self_attn/Constant_48_output_0*/blocks.22/self_attn/Unsqueeze_22_output_0!/blocks.22/self_attn/Unsqueeze_22" Unsqueeze )/blocks.22/self_attn/Constant_49_output_0 /blocks.22/self_attn/Constant_49"Constant*H value*<B,/blocks.22/self_attn/Constant_49_attr::valueJ  '/blocks.22/self_attn/Gather_11_output_0 )/blocks.22/self_attn/Constant_49_output_0*/blocks.22/self_attn/Unsqueeze_23_output_0!/blocks.22/self_attn/Unsqueeze_23" Unsqueeze )/blocks.22/self_attn/Constant_50_output_0 /blocks.22/self_attn/Constant_50"Constant*H value*<B,/blocks.22/self_attn/Constant_50_attr::valueJ )/blocks.22/self_attn/Constant_51_output_0 /blocks.22/self_attn/Constant_51"Constant*H value*<B,/blocks.22/self_attn/Constant_51_attr::valueJ  '/blocks.22/self_attn/Gather_12_output_0 )/blocks.22/self_attn/Constant_51_output_0*/blocks.22/self_attn/Unsqueeze_24_output_0!/blocks.22/self_attn/Unsqueeze_24" Unsqueeze )/blocks.22/self_attn/Constant_52_output_0 /blocks.22/self_attn/Constant_52"Constant*H value*<B,/blocks.22/self_attn/Constant_52_attr::valueJ  '/blocks.22/self_attn/Gather_13_output_0 )/blocks.22/self_attn/Constant_52_output_0*/blocks.22/self_attn/Unsqueeze_25_output_0!/blocks.22/self_attn/Unsqueeze_25" Unsqueeze  */blocks.22/self_attn/Unsqueeze_22_output_0 */blocks.22/self_attn/Unsqueeze_23_output_0 )/blocks.22/self_attn/Constant_50_output_0 */blocks.22/self_attn/Unsqueeze_24_output_0 */blocks.22/self_attn/Unsqueeze_25_output_0'/blocks.22/self_attn/Concat_10_output_0/blocks.22/self_attn/Concat_10"Concat* axis )/blocks.22/self_attn/Constant_53_output_0 /blocks.22/self_attn/Constant_53"Constant*H value*<B,/blocks.22/self_attn/Constant_53_attr::valueJ  '/blocks.22/self_attn/Concat_10_output_0 )/blocks.22/self_attn/Constant_53_output_0'/blocks.22/self_attn/Reshape_5_output_0/blocks.22/self_attn/Reshape_5"Reshape* allowzero w '/blocks.22/self_attn/Reshape_5_output_0&/blocks.22/self_attn/Shape_13_output_0/blocks.22/self_attn/Shape_13"Shape  &/blocks.22/self_attn/Shape_13_output_0//blocks.22/self_attn/ConstantOfShape_1_output_0&/blocks.22/self_attn/ConstantOfShape_1"ConstantOfShape*N value*BB2/blocks.22/self_attn/ConstantOfShape_1_attr::valueJ )/blocks.22/self_attn/Constant_54_output_0 /blocks.22/self_attn/Constant_54"Constant*F value*:B,/blocks.22/self_attn/Constant_54_attr::valueJ  //blocks.22/self_attn/ConstantOfShape_1_output_0 )/blocks.22/self_attn/Constant_54_output_0#/blocks.22/self_attn/Mul_6_output_0/blocks.22/self_attn/Mul_6"Mul  '/blocks.22/self_attn/Reshape_5_output_0 #/blocks.22/self_attn/Mul_6_output_0%/blocks.22/self_attn/Equal_1_output_0/blocks.22/self_attn/Equal_1"Equal  %/blocks.22/self_attn/Equal_1_output_0 //blocks.22/self_attn/ConstantOfShape_1_output_0 '/blocks.22/self_attn/Reshape_5_output_0%/blocks.22/self_attn/Where_1_output_0/blocks.22/self_attn/Where_1"Where  */blocks.22/self_attn/Unsqueeze_21_output_0 %/blocks.22/self_attn/Where_1_output_0&/blocks.22/self_attn/Expand_1_output_0/blocks.22/self_attn/Expand_1"Expand )/blocks.22/self_attn/Constant_55_output_0 /blocks.22/self_attn/Constant_55"Constant*F value*:B,/blocks.22/self_attn/Constant_55_attr::valueJ  '/blocks.22/self_attn/Gather_11_output_0 )/blocks.22/self_attn/Constant_55_output_0#/blocks.22/self_attn/Mul_7_output_0/blocks.22/self_attn/Mul_7"Mul fonnx::Unsqueeze_6979 Constant_8525"Constant*5 value*)BConstant_8525_attr::valueJ  '/blocks.22/self_attn/Gather_10_output_0 onnx::Unsqueeze_6979*/blocks.22/self_attn/Unsqueeze_26_output_0!/blocks.22/self_attn/Unsqueeze_26" Unsqueeze fonnx::Unsqueeze_6981 Constant_8527"Constant*5 value*)BConstant_8527_attr::valueJ  #/blocks.22/self_attn/Mul_7_output_0 onnx::Unsqueeze_6981*/blocks.22/self_attn/Unsqueeze_27_output_0!/blocks.22/self_attn/Unsqueeze_27" Unsqueeze fonnx::Unsqueeze_6983 Constant_8529"Constant*5 value*)BConstant_8529_attr::valueJ  '/blocks.22/self_attn/Gather_12_output_0 onnx::Unsqueeze_6983*/blocks.22/self_attn/Unsqueeze_28_output_0!/blocks.22/self_attn/Unsqueeze_28" Unsqueeze fonnx::Unsqueeze_6985 Constant_8531"Constant*5 value*)BConstant_8531_attr::valueJ  '/blocks.22/self_attn/Gather_13_output_0 onnx::Unsqueeze_6985*/blocks.22/self_attn/Unsqueeze_29_output_0!/blocks.22/self_attn/Unsqueeze_29" Unsqueeze  */blocks.22/self_attn/Unsqueeze_26_output_0 */blocks.22/self_attn/Unsqueeze_27_output_0 */blocks.22/self_attn/Unsqueeze_28_output_0 */blocks.22/self_attn/Unsqueeze_29_output_0'/blocks.22/self_attn/Concat_11_output_0/blocks.22/self_attn/Concat_11"Concat* axis  &/blocks.22/self_attn/Expand_1_output_0 '/blocks.22/self_attn/Concat_11_output_0'/blocks.22/self_attn/Reshape_6_output_0/blocks.22/self_attn/Reshape_6"Reshape* allowzero  '/blocks.22/self_attn/Transpose_output_0 '/blocks.22/self_attn/Reshape_4_output_0$/blocks.22/self_attn/MatMul_output_0/blocks.22/self_attn/MatMul"MatMul )/blocks.22/self_attn/Constant_56_output_0 /blocks.22/self_attn/Constant_56"Constant*B value*6B,/blocks.22/self_attn/Constant_56_attr::valueJ5A  $/blocks.22/self_attn/MatMul_output_0 )/blocks.22/self_attn/Constant_56_output_0#/blocks.22/self_attn/Div_2_output_0/blocks.22/self_attn/Div_2"Div { #/blocks.22/self_attn/Div_2_output_0 attention_mask#/blocks.22/self_attn/Add_2_output_0/blocks.22/self_attn/Add_2"Add  #/blocks.22/self_attn/Add_2_output_0%/blocks.22/self_attn/Softmax_output_0/blocks.22/self_attn/Softmax"Softmax* axis { %/blocks.22/self_attn/Softmax_output_0$/blocks.22/self_attn/Cast_4_output_0/blocks.22/self_attn/Cast_4"Cast* to  $/blocks.22/self_attn/Cast_4_output_0 '/blocks.22/self_attn/Reshape_6_output_0&/blocks.22/self_attn/MatMul_1_output_0/blocks.22/self_attn/MatMul_1"MatMul  &/blocks.22/self_attn/MatMul_1_output_0)/blocks.22/self_attn/Transpose_3_output_0 /blocks.22/self_attn/Transpose_3" Transpose* perm@@@@ fonnx::Unsqueeze_6997 Constant_8543"Constant*5 value*)BConstant_8543_attr::valueJ  $/blocks.22/self_attn/Gather_output_0 onnx::Unsqueeze_6997*/blocks.22/self_attn/Unsqueeze_30_output_0!/blocks.22/self_attn/Unsqueeze_30" Unsqueeze fonnx::Unsqueeze_6999 Constant_8545"Constant*5 value*)BConstant_8545_attr::valueJ  &/blocks.22/self_attn/Gather_1_output_0 onnx::Unsqueeze_6999*/blocks.22/self_attn/Unsqueeze_31_output_0!/blocks.22/self_attn/Unsqueeze_31" Unsqueeze )/blocks.22/self_attn/Constant_57_output_0 /blocks.22/self_attn/Constant_57"Constant*H value*<B,/blocks.22/self_attn/Constant_57_attr::valueJ  */blocks.22/self_attn/Unsqueeze_30_output_0 */blocks.22/self_attn/Unsqueeze_31_output_0 )/blocks.22/self_attn/Constant_57_output_0'/blocks.22/self_attn/Concat_12_output_0/blocks.22/self_attn/Concat_12"Concat* axis  )/blocks.22/self_attn/Transpose_3_output_0 '/blocks.22/self_attn/Concat_12_output_0'/blocks.22/self_attn/Reshape_7_output_0/blocks.22/self_attn/Reshape_7"Reshape* allowzero  '/blocks.22/self_attn/Reshape_7_output_0 onnx::MatMul_9205+/blocks.22/self_attn/o_proj/MatMul_output_0"/blocks.22/self_attn/o_proj/MatMul"MatMul  */blocks.22/input_layernorm/Cast_1_output_0 +/blocks.22/self_attn/o_proj/MatMul_output_0/blocks.22/Add_output_0/blocks.22/Add"Add  /blocks.22/Add_output_01/blocks.22/post_attention_layernorm/Cast_output_0(/blocks.22/post_attention_layernorm/Cast"Cast* to 5/blocks.22/post_attention_layernorm/Constant_output_0,/blocks.22/post_attention_layernorm/Constant"Constant*N value*BB8/blocks.22/post_attention_layernorm/Constant_attr::valueJ@  1/blocks.22/post_attention_layernorm/Cast_output_0 5/blocks.22/post_attention_layernorm/Constant_output_00/blocks.22/post_attention_layernorm/Pow_output_0'/blocks.22/post_attention_layernorm/Pow"Pow  0/blocks.22/post_attention_layernorm/Pow_output_07/blocks.22/post_attention_layernorm/ReduceMean_output_0./blocks.22/post_attention_layernorm/ReduceMean" ReduceMean* axes@* keepdims 7/blocks.22/post_attention_layernorm/Constant_1_output_0./blocks.22/post_attention_layernorm/Constant_1"Constant*P value*DB:/blocks.22/post_attention_layernorm/Constant_1_attr::valueJ75  7/blocks.22/post_attention_layernorm/ReduceMean_output_0 7/blocks.22/post_attention_layernorm/Constant_1_output_00/blocks.22/post_attention_layernorm/Add_output_0'/blocks.22/post_attention_layernorm/Add"Add  0/blocks.22/post_attention_layernorm/Add_output_01/blocks.22/post_attention_layernorm/Sqrt_output_0(/blocks.22/post_attention_layernorm/Sqrt"Sqrt 7/blocks.22/post_attention_layernorm/Constant_2_output_0./blocks.22/post_attention_layernorm/Constant_2"Constant*P value*DB:/blocks.22/post_attention_layernorm/Constant_2_attr::valueJ?  7/blocks.22/post_attention_layernorm/Constant_2_output_0 1/blocks.22/post_attention_layernorm/Sqrt_output_00/blocks.22/post_attention_layernorm/Div_output_0'/blocks.22/post_attention_layernorm/Div"Div  1/blocks.22/post_attention_layernorm/Cast_output_03/blocks.22/post_attention_layernorm/Cast_1_output_0*/blocks.22/post_attention_layernorm/Cast_1"Cast* to  3/blocks.22/post_attention_layernorm/Cast_1_output_0 0/blocks.22/post_attention_layernorm/Div_output_00/blocks.22/post_attention_layernorm/Mul_output_0'/blocks.22/post_attention_layernorm/Mul"Mul  0/blocks.22/post_attention_layernorm/Mul_output_0 )blocks.22.post_attention_layernorm.weight2/blocks.22/post_attention_layernorm/Mul_1_output_0)/blocks.22/post_attention_layernorm/Mul_1"Mul  2/blocks.22/post_attention_layernorm/Mul_1_output_03/blocks.22/post_attention_layernorm/Cast_2_output_0*/blocks.22/post_attention_layernorm/Cast_2"Cast* to  3/blocks.22/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_9206(/blocks.22/mlp/gate_proj/MatMul_output_0/blocks.22/mlp/gate_proj/MatMul"MatMul z (/blocks.22/mlp/gate_proj/MatMul_output_0&/blocks.22/mlp/act_fn/Sigmoid_output_0/blocks.22/mlp/act_fn/Sigmoid"Sigmoid  (/blocks.22/mlp/gate_proj/MatMul_output_0 &/blocks.22/mlp/act_fn/Sigmoid_output_0"/blocks.22/mlp/act_fn/Mul_output_0/blocks.22/mlp/act_fn/Mul"Mul  3/blocks.22/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_9207&/blocks.22/mlp/up_proj/MatMul_output_0/blocks.22/mlp/up_proj/MatMul"MatMul  "/blocks.22/mlp/act_fn/Mul_output_0 &/blocks.22/mlp/up_proj/MatMul_output_0/blocks.22/mlp/Mul_output_0/blocks.22/mlp/Mul"Mul  /blocks.22/mlp/Mul_output_0 onnx::MatMul_9208(/blocks.22/mlp/down_proj/MatMul_output_0/blocks.22/mlp/down_proj/MatMul"MatMul  3/blocks.22/post_attention_layernorm/Cast_1_output_0 (/blocks.22/mlp/down_proj/MatMul_output_0/blocks.22/Add_1_output_0/blocks.22/Add_1"Add c/Constant_15_output_0 /Constant_15"Constant*2 value*&B/Constant_15_attr::valueJ ^ past_key_values /Constant_15_output_0/Gather_23_output_0 /Gather_23"Gather* axis /blocks.23/Constant_output_0/blocks.23/Constant"Constant*K value*?B/blocks.23/Constant_attr::valueJ  /blocks.22/Add_1_output_0 /blocks.23/Constant_output_0/blocks.23/Reshape_output_0/blocks.23/Reshape"Reshape* allowzero y /blocks.23/Reshape_output_0(/blocks.23/input_layernorm/Cast_output_0/blocks.23/input_layernorm/Cast"Cast* to ,/blocks.23/input_layernorm/Constant_output_0#/blocks.23/input_layernorm/Constant"Constant*E value*9B//blocks.23/input_layernorm/Constant_attr::valueJ@  (/blocks.23/input_layernorm/Cast_output_0 ,/blocks.23/input_layernorm/Constant_output_0'/blocks.23/input_layernorm/Pow_output_0/blocks.23/input_layernorm/Pow"Pow  '/blocks.23/input_layernorm/Pow_output_0./blocks.23/input_layernorm/ReduceMean_output_0%/blocks.23/input_layernorm/ReduceMean" ReduceMean* axes@* keepdims ./blocks.23/input_layernorm/Constant_1_output_0%/blocks.23/input_layernorm/Constant_1"Constant*G value*;B1/blocks.23/input_layernorm/Constant_1_attr::valueJ75  ./blocks.23/input_layernorm/ReduceMean_output_0 ./blocks.23/input_layernorm/Constant_1_output_0'/blocks.23/input_layernorm/Add_output_0/blocks.23/input_layernorm/Add"Add z '/blocks.23/input_layernorm/Add_output_0(/blocks.23/input_layernorm/Sqrt_output_0/blocks.23/input_layernorm/Sqrt"Sqrt ./blocks.23/input_layernorm/Constant_2_output_0%/blocks.23/input_layernorm/Constant_2"Constant*G value*;B1/blocks.23/input_layernorm/Constant_2_attr::valueJ?  ./blocks.23/input_layernorm/Constant_2_output_0 (/blocks.23/input_layernorm/Sqrt_output_0'/blocks.23/input_layernorm/Div_output_0/blocks.23/input_layernorm/Div"Div  (/blocks.23/input_layernorm/Cast_output_0*/blocks.23/input_layernorm/Cast_1_output_0!/blocks.23/input_layernorm/Cast_1"Cast* to  */blocks.23/input_layernorm/Cast_1_output_0 '/blocks.23/input_layernorm/Div_output_0'/blocks.23/input_layernorm/Mul_output_0/blocks.23/input_layernorm/Mul"Mul  '/blocks.23/input_layernorm/Mul_output_0 blocks.23.input_layernorm.weight)/blocks.23/input_layernorm/Mul_1_output_0 /blocks.23/input_layernorm/Mul_1"Mul  )/blocks.23/input_layernorm/Mul_1_output_0*/blocks.23/input_layernorm/Cast_2_output_0!/blocks.23/input_layernorm/Cast_2"Cast* to t */blocks.23/input_layernorm/Cast_2_output_0#/blocks.23/self_attn/Shape_output_0/blocks.23/self_attn/Shape"Shape &/blocks.23/self_attn/Constant_output_0/blocks.23/self_attn/Constant"Constant*C value*7B)/blocks.23/self_attn/Constant_attr::valueJ  #/blocks.23/self_attn/Shape_output_0 &/blocks.23/self_attn/Constant_output_0$/blocks.23/self_attn/Gather_output_0/blocks.23/self_attn/Gather"Gather* axis x */blocks.23/input_layernorm/Cast_2_output_0%/blocks.23/self_attn/Shape_1_output_0/blocks.23/self_attn/Shape_1"Shape (/blocks.23/self_attn/Constant_1_output_0/blocks.23/self_attn/Constant_1"Constant*E value*9B+/blocks.23/self_attn/Constant_1_attr::valueJ  %/blocks.23/self_attn/Shape_1_output_0 (/blocks.23/self_attn/Constant_1_output_0&/blocks.23/self_attn/Gather_1_output_0/blocks.23/self_attn/Gather_1"Gather* axis  */blocks.23/input_layernorm/Cast_2_output_0 onnx::MatMul_9209+/blocks.23/self_attn/q_proj/MatMul_output_0"/blocks.23/self_attn/q_proj/MatMul"MatMul  */blocks.23/input_layernorm/Cast_2_output_0 onnx::MatMul_9210+/blocks.23/self_attn/k_proj/MatMul_output_0"/blocks.23/self_attn/k_proj/MatMul"MatMul  */blocks.23/input_layernorm/Cast_2_output_0 onnx::MatMul_9211+/blocks.23/self_attn/v_proj/MatMul_output_0"/blocks.23/self_attn/v_proj/MatMul"MatMul fonnx::Unsqueeze_7060 Constant_8598"Constant*5 value*)BConstant_8598_attr::valueJ  $/blocks.23/self_attn/Gather_output_0 onnx::Unsqueeze_7060'/blocks.23/self_attn/Unsqueeze_output_0/blocks.23/self_attn/Unsqueeze" Unsqueeze fonnx::Unsqueeze_7062 Constant_8600"Constant*5 value*)BConstant_8600_attr::valueJ  &/blocks.23/self_attn/Gather_1_output_0 onnx::Unsqueeze_7062)/blocks.23/self_attn/Unsqueeze_1_output_0 /blocks.23/self_attn/Unsqueeze_1" Unsqueeze (/blocks.23/self_attn/Constant_2_output_0/blocks.23/self_attn/Constant_2"Constant*G value*;B+/blocks.23/self_attn/Constant_2_attr::valueJ (/blocks.23/self_attn/Constant_3_output_0/blocks.23/self_attn/Constant_3"Constant*G value*;B+/blocks.23/self_attn/Constant_3_attr::valueJ  '/blocks.23/self_attn/Unsqueeze_output_0 )/blocks.23/self_attn/Unsqueeze_1_output_0 (/blocks.23/self_attn/Constant_2_output_0 (/blocks.23/self_attn/Constant_3_output_0$/blocks.23/self_attn/Concat_output_0/blocks.23/self_attn/Concat"Concat* axis  +/blocks.23/self_attn/q_proj/MatMul_output_0 $/blocks.23/self_attn/Concat_output_0%/blocks.23/self_attn/Reshape_output_0/blocks.23/self_attn/Reshape"Reshape* allowzero fonnx::Unsqueeze_7070 Constant_8606"Constant*5 value*)BConstant_8606_attr::valueJ  $/blocks.23/self_attn/Gather_output_0 onnx::Unsqueeze_7070)/blocks.23/self_attn/Unsqueeze_2_output_0 /blocks.23/self_attn/Unsqueeze_2" Unsqueeze fonnx::Unsqueeze_7072 Constant_8608"Constant*5 value*)BConstant_8608_attr::valueJ  &/blocks.23/self_attn/Gather_1_output_0 onnx::Unsqueeze_7072)/blocks.23/self_attn/Unsqueeze_3_output_0 /blocks.23/self_attn/Unsqueeze_3" Unsqueeze (/blocks.23/self_attn/Constant_4_output_0/blocks.23/self_attn/Constant_4"Constant*G value*;B+/blocks.23/self_attn/Constant_4_attr::valueJ (/blocks.23/self_attn/Constant_5_output_0/blocks.23/self_attn/Constant_5"Constant*G value*;B+/blocks.23/self_attn/Constant_5_attr::valueJ  )/blocks.23/self_attn/Unsqueeze_2_output_0 )/blocks.23/self_attn/Unsqueeze_3_output_0 (/blocks.23/self_attn/Constant_4_output_0 (/blocks.23/self_attn/Constant_5_output_0&/blocks.23/self_attn/Concat_1_output_0/blocks.23/self_attn/Concat_1"Concat* axis fonnx::Unsqueeze_7079 Constant_8613"Constant*5 value*)BConstant_8613_attr::valueJ  $/blocks.23/self_attn/Gather_output_0 onnx::Unsqueeze_7079)/blocks.23/self_attn/Unsqueeze_4_output_0 /blocks.23/self_attn/Unsqueeze_4" Unsqueeze fonnx::Unsqueeze_7081 Constant_8615"Constant*5 value*)BConstant_8615_attr::valueJ  &/blocks.23/self_attn/Gather_1_output_0 onnx::Unsqueeze_7081)/blocks.23/self_attn/Unsqueeze_5_output_0 /blocks.23/self_attn/Unsqueeze_5" Unsqueeze (/blocks.23/self_attn/Constant_6_output_0/blocks.23/self_attn/Constant_6"Constant*G value*;B+/blocks.23/self_attn/Constant_6_attr::valueJ (/blocks.23/self_attn/Constant_7_output_0/blocks.23/self_attn/Constant_7"Constant*G value*;B+/blocks.23/self_attn/Constant_7_attr::valueJ  )/blocks.23/self_attn/Unsqueeze_4_output_0 )/blocks.23/self_attn/Unsqueeze_5_output_0 (/blocks.23/self_attn/Constant_6_output_0 (/blocks.23/self_attn/Constant_7_output_0&/blocks.23/self_attn/Concat_2_output_0/blocks.23/self_attn/Concat_2"Concat* axis  +/blocks.23/self_attn/k_proj/MatMul_output_0 &/blocks.23/self_attn/Concat_1_output_0'/blocks.23/self_attn/Reshape_1_output_0/blocks.23/self_attn/Reshape_1"Reshape* allowzero  +/blocks.23/self_attn/v_proj/MatMul_output_0 &/blocks.23/self_attn/Concat_2_output_0'/blocks.23/self_attn/Reshape_2_output_0/blocks.23/self_attn/Reshape_2"Reshape* allowzero  %/blocks.23/self_attn/Reshape_output_0)/blocks.23/self_attn/q_norm/Cast_output_0 /blocks.23/self_attn/q_norm/Cast"Cast* to -/blocks.23/self_attn/q_norm/Constant_output_0$/blocks.23/self_attn/q_norm/Constant"Constant*F value*:B0/blocks.23/self_attn/q_norm/Constant_attr::valueJ@  )/blocks.23/self_attn/q_norm/Cast_output_0 -/blocks.23/self_attn/q_norm/Constant_output_0(/blocks.23/self_attn/q_norm/Pow_output_0/blocks.23/self_attn/q_norm/Pow"Pow  (/blocks.23/self_attn/q_norm/Pow_output_0//blocks.23/self_attn/q_norm/ReduceMean_output_0&/blocks.23/self_attn/q_norm/ReduceMean" ReduceMean* axes@* keepdims //blocks.23/self_attn/q_norm/Constant_1_output_0&/blocks.23/self_attn/q_norm/Constant_1"Constant*H value*<B2/blocks.23/self_attn/q_norm/Constant_1_attr::valueJ75  //blocks.23/self_attn/q_norm/ReduceMean_output_0 //blocks.23/self_attn/q_norm/Constant_1_output_0(/blocks.23/self_attn/q_norm/Add_output_0/blocks.23/self_attn/q_norm/Add"Add } (/blocks.23/self_attn/q_norm/Add_output_0)/blocks.23/self_attn/q_norm/Sqrt_output_0 /blocks.23/self_attn/q_norm/Sqrt"Sqrt //blocks.23/self_attn/q_norm/Constant_2_output_0&/blocks.23/self_attn/q_norm/Constant_2"Constant*H value*<B2/blocks.23/self_attn/q_norm/Constant_2_attr::valueJ?  //blocks.23/self_attn/q_norm/Constant_2_output_0 )/blocks.23/self_attn/q_norm/Sqrt_output_0(/blocks.23/self_attn/q_norm/Div_output_0/blocks.23/self_attn/q_norm/Div"Div  )/blocks.23/self_attn/q_norm/Cast_output_0+/blocks.23/self_attn/q_norm/Cast_1_output_0"/blocks.23/self_attn/q_norm/Cast_1"Cast* to  +/blocks.23/self_attn/q_norm/Cast_1_output_0 (/blocks.23/self_attn/q_norm/Div_output_0(/blocks.23/self_attn/q_norm/Mul_output_0/blocks.23/self_attn/q_norm/Mul"Mul  (/blocks.23/self_attn/q_norm/Mul_output_0 !blocks.23.self_attn.q_norm.weight*/blocks.23/self_attn/q_norm/Mul_1_output_0!/blocks.23/self_attn/q_norm/Mul_1"Mul  */blocks.23/self_attn/q_norm/Mul_1_output_0+/blocks.23/self_attn/q_norm/Cast_2_output_0"/blocks.23/self_attn/q_norm/Cast_2"Cast* to  '/blocks.23/self_attn/Reshape_1_output_0)/blocks.23/self_attn/k_norm/Cast_output_0 /blocks.23/self_attn/k_norm/Cast"Cast* to -/blocks.23/self_attn/k_norm/Constant_output_0$/blocks.23/self_attn/k_norm/Constant"Constant*F value*:B0/blocks.23/self_attn/k_norm/Constant_attr::valueJ@  )/blocks.23/self_attn/k_norm/Cast_output_0 -/blocks.23/self_attn/k_norm/Constant_output_0(/blocks.23/self_attn/k_norm/Pow_output_0/blocks.23/self_attn/k_norm/Pow"Pow  (/blocks.23/self_attn/k_norm/Pow_output_0//blocks.23/self_attn/k_norm/ReduceMean_output_0&/blocks.23/self_attn/k_norm/ReduceMean" ReduceMean* axes@* keepdims //blocks.23/self_attn/k_norm/Constant_1_output_0&/blocks.23/self_attn/k_norm/Constant_1"Constant*H value*<B2/blocks.23/self_attn/k_norm/Constant_1_attr::valueJ75  //blocks.23/self_attn/k_norm/ReduceMean_output_0 //blocks.23/self_attn/k_norm/Constant_1_output_0(/blocks.23/self_attn/k_norm/Add_output_0/blocks.23/self_attn/k_norm/Add"Add } (/blocks.23/self_attn/k_norm/Add_output_0)/blocks.23/self_attn/k_norm/Sqrt_output_0 /blocks.23/self_attn/k_norm/Sqrt"Sqrt //blocks.23/self_attn/k_norm/Constant_2_output_0&/blocks.23/self_attn/k_norm/Constant_2"Constant*H value*<B2/blocks.23/self_attn/k_norm/Constant_2_attr::valueJ?  //blocks.23/self_attn/k_norm/Constant_2_output_0 )/blocks.23/self_attn/k_norm/Sqrt_output_0(/blocks.23/self_attn/k_norm/Div_output_0/blocks.23/self_attn/k_norm/Div"Div  )/blocks.23/self_attn/k_norm/Cast_output_0+/blocks.23/self_attn/k_norm/Cast_1_output_0"/blocks.23/self_attn/k_norm/Cast_1"Cast* to  +/blocks.23/self_attn/k_norm/Cast_1_output_0 (/blocks.23/self_attn/k_norm/Div_output_0(/blocks.23/self_attn/k_norm/Mul_output_0/blocks.23/self_attn/k_norm/Mul"Mul  (/blocks.23/self_attn/k_norm/Mul_output_0 !blocks.23.self_attn.k_norm.weight*/blocks.23/self_attn/k_norm/Mul_1_output_0!/blocks.23/self_attn/k_norm/Mul_1"Mul  */blocks.23/self_attn/k_norm/Mul_1_output_0+/blocks.23/self_attn/k_norm/Cast_2_output_0"/blocks.23/self_attn/k_norm/Cast_2"Cast* to  +/blocks.23/self_attn/q_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0!/blocks.23/self_attn/Mul_output_0/blocks.23/self_attn/Mul"Mul y +/blocks.23/self_attn/q_norm/Cast_2_output_0%/blocks.23/self_attn/Shape_2_output_0/blocks.23/self_attn/Shape_2"Shape (/blocks.23/self_attn/Constant_8_output_0/blocks.23/self_attn/Constant_8"Constant*E value*9B+/blocks.23/self_attn/Constant_8_attr::valueJ  %/blocks.23/self_attn/Shape_2_output_0 (/blocks.23/self_attn/Constant_8_output_0&/blocks.23/self_attn/Gather_2_output_0/blocks.23/self_attn/Gather_2"Gather* axis (/blocks.23/self_attn/Constant_9_output_0/blocks.23/self_attn/Constant_9"Constant*E value*9B+/blocks.23/self_attn/Constant_9_attr::valueJ  &/blocks.23/self_attn/Gather_2_output_0 (/blocks.23/self_attn/Constant_9_output_0!/blocks.23/self_attn/Div_output_0/blocks.23/self_attn/Div"Div s !/blocks.23/self_attn/Div_output_0"/blocks.23/self_attn/Cast_output_0/blocks.23/self_attn/Cast"Cast* to x "/blocks.23/self_attn/Cast_output_0$/blocks.23/self_attn/Cast_1_output_0/blocks.23/self_attn/Cast_1"Cast* to )/blocks.23/self_attn/Constant_10_output_0 /blocks.23/self_attn/Constant_10"Constant*H value*<B,/blocks.23/self_attn/Constant_10_attr::valueJ )/blocks.23/self_attn/Constant_11_output_0 /blocks.23/self_attn/Constant_11"Constant*H value*<B,/blocks.23/self_attn/Constant_11_attr::valueJ )/blocks.23/self_attn/Constant_12_output_0 /blocks.23/self_attn/Constant_12"Constant*H value*<B,/blocks.23/self_attn/Constant_12_attr::valueJ  $/blocks.23/self_attn/Cast_1_output_0 )/blocks.23/self_attn/Constant_12_output_0)/blocks.23/self_attn/Unsqueeze_6_output_0 /blocks.23/self_attn/Unsqueeze_6" Unsqueeze )/blocks.23/self_attn/Constant_13_output_0 /blocks.23/self_attn/Constant_13"Constant*H value*<B,/blocks.23/self_attn/Constant_13_attr::valueJ  +/blocks.23/self_attn/q_norm/Cast_2_output_0 )/blocks.23/self_attn/Constant_11_output_0 )/blocks.23/self_attn/Unsqueeze_6_output_0 )/blocks.23/self_attn/Constant_10_output_0 )/blocks.23/self_attn/Constant_13_output_0#/blocks.23/self_attn/Slice_output_0/blocks.23/self_attn/Slice"Slice )/blocks.23/self_attn/Constant_14_output_0 /blocks.23/self_attn/Constant_14"Constant*H value*<B,/blocks.23/self_attn/Constant_14_attr::valueJ )/blocks.23/self_attn/Constant_15_output_0 /blocks.23/self_attn/Constant_15"Constant*H value*<B,/blocks.23/self_attn/Constant_15_attr::valueJ  $/blocks.23/self_attn/Cast_1_output_0 )/blocks.23/self_attn/Constant_15_output_0)/blocks.23/self_attn/Unsqueeze_7_output_0 /blocks.23/self_attn/Unsqueeze_7" Unsqueeze )/blocks.23/self_attn/Constant_16_output_0 /blocks.23/self_attn/Constant_16"Constant*H value*<B,/blocks.23/self_attn/Constant_16_attr::valueJ )/blocks.23/self_attn/Constant_17_output_0 /blocks.23/self_attn/Constant_17"Constant*H value*<B,/blocks.23/self_attn/Constant_17_attr::valueJ  +/blocks.23/self_attn/q_norm/Cast_2_output_0 )/blocks.23/self_attn/Unsqueeze_7_output_0 )/blocks.23/self_attn/Constant_16_output_0 )/blocks.23/self_attn/Constant_14_output_0 )/blocks.23/self_attn/Constant_17_output_0%/blocks.23/self_attn/Slice_1_output_0/blocks.23/self_attn/Slice_1"Slice i %/blocks.23/self_attn/Slice_1_output_0!/blocks.23/self_attn/Neg_output_0/blocks.23/self_attn/Neg"Neg  !/blocks.23/self_attn/Neg_output_0 #/blocks.23/self_attn/Slice_output_0&/blocks.23/self_attn/Concat_3_output_0/blocks.23/self_attn/Concat_3"Concat* axis  &/blocks.23/self_attn/Concat_3_output_0 %/blocks.0/self_attn/Gather_3_output_0#/blocks.23/self_attn/Mul_1_output_0/blocks.23/self_attn/Mul_1"Mul  !/blocks.23/self_attn/Mul_output_0 #/blocks.23/self_attn/Mul_1_output_0!/blocks.23/self_attn/Add_output_0/blocks.23/self_attn/Add"Add  +/blocks.23/self_attn/k_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0#/blocks.23/self_attn/Mul_2_output_0/blocks.23/self_attn/Mul_2"Mul y +/blocks.23/self_attn/k_norm/Cast_2_output_0%/blocks.23/self_attn/Shape_3_output_0/blocks.23/self_attn/Shape_3"Shape )/blocks.23/self_attn/Constant_18_output_0 /blocks.23/self_attn/Constant_18"Constant*F value*:B,/blocks.23/self_attn/Constant_18_attr::valueJ  %/blocks.23/self_attn/Shape_3_output_0 )/blocks.23/self_attn/Constant_18_output_0&/blocks.23/self_attn/Gather_3_output_0/blocks.23/self_attn/Gather_3"Gather* axis )/blocks.23/self_attn/Constant_19_output_0 /blocks.23/self_attn/Constant_19"Constant*F value*:B,/blocks.23/self_attn/Constant_19_attr::valueJ  &/blocks.23/self_attn/Gather_3_output_0 )/blocks.23/self_attn/Constant_19_output_0#/blocks.23/self_attn/Div_1_output_0/blocks.23/self_attn/Div_1"Div y #/blocks.23/self_attn/Div_1_output_0$/blocks.23/self_attn/Cast_2_output_0/blocks.23/self_attn/Cast_2"Cast* to z $/blocks.23/self_attn/Cast_2_output_0$/blocks.23/self_attn/Cast_3_output_0/blocks.23/self_attn/Cast_3"Cast* to )/blocks.23/self_attn/Constant_20_output_0 /blocks.23/self_attn/Constant_20"Constant*H value*<B,/blocks.23/self_attn/Constant_20_attr::valueJ )/blocks.23/self_attn/Constant_21_output_0 /blocks.23/self_attn/Constant_21"Constant*H value*<B,/blocks.23/self_attn/Constant_21_attr::valueJ )/blocks.23/self_attn/Constant_22_output_0 /blocks.23/self_attn/Constant_22"Constant*H value*<B,/blocks.23/self_attn/Constant_22_attr::valueJ  $/blocks.23/self_attn/Cast_3_output_0 )/blocks.23/self_attn/Constant_22_output_0)/blocks.23/self_attn/Unsqueeze_8_output_0 /blocks.23/self_attn/Unsqueeze_8" Unsqueeze )/blocks.23/self_attn/Constant_23_output_0 /blocks.23/self_attn/Constant_23"Constant*H value*<B,/blocks.23/self_attn/Constant_23_attr::valueJ  +/blocks.23/self_attn/k_norm/Cast_2_output_0 )/blocks.23/self_attn/Constant_21_output_0 )/blocks.23/self_attn/Unsqueeze_8_output_0 )/blocks.23/self_attn/Constant_20_output_0 )/blocks.23/self_attn/Constant_23_output_0%/blocks.23/self_attn/Slice_2_output_0/blocks.23/self_attn/Slice_2"Slice )/blocks.23/self_attn/Constant_24_output_0 /blocks.23/self_attn/Constant_24"Constant*H value*<B,/blocks.23/self_attn/Constant_24_attr::valueJ )/blocks.23/self_attn/Constant_25_output_0 /blocks.23/self_attn/Constant_25"Constant*H value*<B,/blocks.23/self_attn/Constant_25_attr::valueJ  $/blocks.23/self_attn/Cast_3_output_0 )/blocks.23/self_attn/Constant_25_output_0)/blocks.23/self_attn/Unsqueeze_9_output_0 /blocks.23/self_attn/Unsqueeze_9" Unsqueeze )/blocks.23/self_attn/Constant_26_output_0 /blocks.23/self_attn/Constant_26"Constant*H value*<B,/blocks.23/self_attn/Constant_26_attr::valueJ )/blocks.23/self_attn/Constant_27_output_0 /blocks.23/self_attn/Constant_27"Constant*H value*<B,/blocks.23/self_attn/Constant_27_attr::valueJ  +/blocks.23/self_attn/k_norm/Cast_2_output_0 )/blocks.23/self_attn/Unsqueeze_9_output_0 )/blocks.23/self_attn/Constant_26_output_0 )/blocks.23/self_attn/Constant_24_output_0 )/blocks.23/self_attn/Constant_27_output_0%/blocks.23/self_attn/Slice_3_output_0/blocks.23/self_attn/Slice_3"Slice m %/blocks.23/self_attn/Slice_3_output_0#/blocks.23/self_attn/Neg_1_output_0/blocks.23/self_attn/Neg_1"Neg  #/blocks.23/self_attn/Neg_1_output_0 %/blocks.23/self_attn/Slice_2_output_0&/blocks.23/self_attn/Concat_4_output_0/blocks.23/self_attn/Concat_4"Concat* axis  &/blocks.23/self_attn/Concat_4_output_0 %/blocks.0/self_attn/Gather_3_output_0#/blocks.23/self_attn/Mul_3_output_0/blocks.23/self_attn/Mul_3"Mul  #/blocks.23/self_attn/Mul_2_output_0 #/blocks.23/self_attn/Mul_3_output_0#/blocks.23/self_attn/Add_1_output_0/blocks.23/self_attn/Add_1"Add  /Gather_23_output_0 /rotary/Constant_3_output_0&/blocks.23/self_attn/Gather_4_output_0/blocks.23/self_attn/Gather_4"Gather* axis  /Gather_23_output_0 /rotary/Constant_8_output_0&/blocks.23/self_attn/Gather_5_output_0/blocks.23/self_attn/Gather_5"Gather* axis  &/blocks.23/self_attn/Gather_4_output_0 #/blocks.23/self_attn/Add_1_output_0&/blocks.23/self_attn/Concat_5_output_0/blocks.23/self_attn/Concat_5"Concat* axis  &/blocks.23/self_attn/Gather_5_output_0 '/blocks.23/self_attn/Reshape_2_output_0&/blocks.23/self_attn/Concat_6_output_0/blocks.23/self_attn/Concat_6"Concat* axis )/blocks.23/self_attn/Constant_28_output_0 /blocks.23/self_attn/Constant_28"Constant*H value*<B,/blocks.23/self_attn/Constant_28_attr::valueJ  &/blocks.23/self_attn/Concat_5_output_0 )/blocks.23/self_attn/Constant_28_output_0*/blocks.23/self_attn/Unsqueeze_10_output_0!/blocks.23/self_attn/Unsqueeze_10" Unsqueeze )/blocks.23/self_attn/Constant_29_output_0 /blocks.23/self_attn/Constant_29"Constant*H value*<B,/blocks.23/self_attn/Constant_29_attr::valueJ  &/blocks.23/self_attn/Concat_6_output_0 )/blocks.23/self_attn/Constant_29_output_0*/blocks.23/self_attn/Unsqueeze_11_output_0!/blocks.23/self_attn/Unsqueeze_11" Unsqueeze  */blocks.23/self_attn/Unsqueeze_10_output_0 */blocks.23/self_attn/Unsqueeze_11_output_0&/blocks.23/self_attn/Concat_7_output_0/blocks.23/self_attn/Concat_7"Concat* axis  !/blocks.23/self_attn/Add_output_0'/blocks.23/self_attn/Transpose_output_0/blocks.23/self_attn/Transpose" Transpose* perm@@@@  &/blocks.23/self_attn/Concat_5_output_0)/blocks.23/self_attn/Transpose_1_output_0 /blocks.23/self_attn/Transpose_1" Transpose* perm@@@@  &/blocks.23/self_attn/Concat_6_output_0)/blocks.23/self_attn/Transpose_2_output_0 /blocks.23/self_attn/Transpose_2" Transpose* perm@@@@ w )/blocks.23/self_attn/Transpose_1_output_0%/blocks.23/self_attn/Shape_4_output_0/blocks.23/self_attn/Shape_4"Shape )/blocks.23/self_attn/Constant_30_output_0 /blocks.23/self_attn/Constant_30"Constant*F value*:B,/blocks.23/self_attn/Constant_30_attr::valueJ  %/blocks.23/self_attn/Shape_4_output_0 )/blocks.23/self_attn/Constant_30_output_0&/blocks.23/self_attn/Gather_6_output_0/blocks.23/self_attn/Gather_6"Gather* axis w )/blocks.23/self_attn/Transpose_1_output_0%/blocks.23/self_attn/Shape_5_output_0/blocks.23/self_attn/Shape_5"Shape )/blocks.23/self_attn/Constant_31_output_0 /blocks.23/self_attn/Constant_31"Constant*F value*:B,/blocks.23/self_attn/Constant_31_attr::valueJ  %/blocks.23/self_attn/Shape_5_output_0 )/blocks.23/self_attn/Constant_31_output_0&/blocks.23/self_attn/Gather_7_output_0/blocks.23/self_attn/Gather_7"Gather* axis w )/blocks.23/self_attn/Transpose_1_output_0%/blocks.23/self_attn/Shape_6_output_0/blocks.23/self_attn/Shape_6"Shape )/blocks.23/self_attn/Constant_32_output_0 /blocks.23/self_attn/Constant_32"Constant*F value*:B,/blocks.23/self_attn/Constant_32_attr::valueJ  %/blocks.23/self_attn/Shape_6_output_0 )/blocks.23/self_attn/Constant_32_output_0&/blocks.23/self_attn/Gather_8_output_0/blocks.23/self_attn/Gather_8"Gather* axis w )/blocks.23/self_attn/Transpose_1_output_0%/blocks.23/self_attn/Shape_7_output_0/blocks.23/self_attn/Shape_7"Shape )/blocks.23/self_attn/Constant_33_output_0 /blocks.23/self_attn/Constant_33"Constant*F value*:B,/blocks.23/self_attn/Constant_33_attr::valueJ  %/blocks.23/self_attn/Shape_7_output_0 )/blocks.23/self_attn/Constant_33_output_0&/blocks.23/self_attn/Gather_9_output_0/blocks.23/self_attn/Gather_9"Gather* axis )/blocks.23/self_attn/Constant_34_output_0 /blocks.23/self_attn/Constant_34"Constant*H value*<B,/blocks.23/self_attn/Constant_34_attr::valueJ  )/blocks.23/self_attn/Transpose_1_output_0 )/blocks.23/self_attn/Constant_34_output_0*/blocks.23/self_attn/Unsqueeze_12_output_0!/blocks.23/self_attn/Unsqueeze_12" Unsqueeze )/blocks.23/self_attn/Constant_35_output_0 /blocks.23/self_attn/Constant_35"Constant*H value*<B,/blocks.23/self_attn/Constant_35_attr::valueJ  &/blocks.23/self_attn/Gather_6_output_0 )/blocks.23/self_attn/Constant_35_output_0*/blocks.23/self_attn/Unsqueeze_13_output_0!/blocks.23/self_attn/Unsqueeze_13" Unsqueeze )/blocks.23/self_attn/Constant_36_output_0 /blocks.23/self_attn/Constant_36"Constant*H value*<B,/blocks.23/self_attn/Constant_36_attr::valueJ  &/blocks.23/self_attn/Gather_7_output_0 )/blocks.23/self_attn/Constant_36_output_0*/blocks.23/self_attn/Unsqueeze_14_output_0!/blocks.23/self_attn/Unsqueeze_14" Unsqueeze )/blocks.23/self_attn/Constant_37_output_0 /blocks.23/self_attn/Constant_37"Constant*H value*<B,/blocks.23/self_attn/Constant_37_attr::valueJ )/blocks.23/self_attn/Constant_38_output_0 /blocks.23/self_attn/Constant_38"Constant*H value*<B,/blocks.23/self_attn/Constant_38_attr::valueJ  &/blocks.23/self_attn/Gather_8_output_0 )/blocks.23/self_attn/Constant_38_output_0*/blocks.23/self_attn/Unsqueeze_15_output_0!/blocks.23/self_attn/Unsqueeze_15" Unsqueeze )/blocks.23/self_attn/Constant_39_output_0 /blocks.23/self_attn/Constant_39"Constant*H value*<B,/blocks.23/self_attn/Constant_39_attr::valueJ  &/blocks.23/self_attn/Gather_9_output_0 )/blocks.23/self_attn/Constant_39_output_0*/blocks.23/self_attn/Unsqueeze_16_output_0!/blocks.23/self_attn/Unsqueeze_16" Unsqueeze  */blocks.23/self_attn/Unsqueeze_13_output_0 */blocks.23/self_attn/Unsqueeze_14_output_0 )/blocks.23/self_attn/Constant_37_output_0 */blocks.23/self_attn/Unsqueeze_15_output_0 */blocks.23/self_attn/Unsqueeze_16_output_0&/blocks.23/self_attn/Concat_8_output_0/blocks.23/self_attn/Concat_8"Concat* axis )/blocks.23/self_attn/Constant_40_output_0 /blocks.23/self_attn/Constant_40"Constant*H value*<B,/blocks.23/self_attn/Constant_40_attr::valueJ  &/blocks.23/self_attn/Concat_8_output_0 )/blocks.23/self_attn/Constant_40_output_0'/blocks.23/self_attn/Reshape_3_output_0/blocks.23/self_attn/Reshape_3"Reshape* allowzero u '/blocks.23/self_attn/Reshape_3_output_0%/blocks.23/self_attn/Shape_8_output_0/blocks.23/self_attn/Shape_8"Shape  %/blocks.23/self_attn/Shape_8_output_0-/blocks.23/self_attn/ConstantOfShape_output_0$/blocks.23/self_attn/ConstantOfShape"ConstantOfShape*L value*@B0/blocks.23/self_attn/ConstantOfShape_attr::valueJ )/blocks.23/self_attn/Constant_41_output_0 /blocks.23/self_attn/Constant_41"Constant*F value*:B,/blocks.23/self_attn/Constant_41_attr::valueJ  -/blocks.23/self_attn/ConstantOfShape_output_0 )/blocks.23/self_attn/Constant_41_output_0#/blocks.23/self_attn/Mul_4_output_0/blocks.23/self_attn/Mul_4"Mul  '/blocks.23/self_attn/Reshape_3_output_0 #/blocks.23/self_attn/Mul_4_output_0#/blocks.23/self_attn/Equal_output_0/blocks.23/self_attn/Equal"Equal  #/blocks.23/self_attn/Equal_output_0 -/blocks.23/self_attn/ConstantOfShape_output_0 '/blocks.23/self_attn/Reshape_3_output_0#/blocks.23/self_attn/Where_output_0/blocks.23/self_attn/Where"Where  */blocks.23/self_attn/Unsqueeze_12_output_0 #/blocks.23/self_attn/Where_output_0$/blocks.23/self_attn/Expand_output_0/blocks.23/self_attn/Expand"Expand )/blocks.23/self_attn/Constant_42_output_0 /blocks.23/self_attn/Constant_42"Constant*F value*:B,/blocks.23/self_attn/Constant_42_attr::valueJ  &/blocks.23/self_attn/Gather_7_output_0 )/blocks.23/self_attn/Constant_42_output_0#/blocks.23/self_attn/Mul_5_output_0/blocks.23/self_attn/Mul_5"Mul fonnx::Unsqueeze_7224 Constant_8743"Constant*5 value*)BConstant_8743_attr::valueJ  &/blocks.23/self_attn/Gather_6_output_0 onnx::Unsqueeze_7224*/blocks.23/self_attn/Unsqueeze_17_output_0!/blocks.23/self_attn/Unsqueeze_17" Unsqueeze fonnx::Unsqueeze_7226 Constant_8745"Constant*5 value*)BConstant_8745_attr::valueJ  #/blocks.23/self_attn/Mul_5_output_0 onnx::Unsqueeze_7226*/blocks.23/self_attn/Unsqueeze_18_output_0!/blocks.23/self_attn/Unsqueeze_18" Unsqueeze fonnx::Unsqueeze_7228 Constant_8747"Constant*5 value*)BConstant_8747_attr::valueJ  &/blocks.23/self_attn/Gather_8_output_0 onnx::Unsqueeze_7228*/blocks.23/self_attn/Unsqueeze_19_output_0!/blocks.23/self_attn/Unsqueeze_19" Unsqueeze fonnx::Unsqueeze_7230 Constant_8749"Constant*5 value*)BConstant_8749_attr::valueJ  &/blocks.23/self_attn/Gather_9_output_0 onnx::Unsqueeze_7230*/blocks.23/self_attn/Unsqueeze_20_output_0!/blocks.23/self_attn/Unsqueeze_20" Unsqueeze  */blocks.23/self_attn/Unsqueeze_17_output_0 */blocks.23/self_attn/Unsqueeze_18_output_0 */blocks.23/self_attn/Unsqueeze_19_output_0 */blocks.23/self_attn/Unsqueeze_20_output_0&/blocks.23/self_attn/Concat_9_output_0/blocks.23/self_attn/Concat_9"Concat* axis  $/blocks.23/self_attn/Expand_output_0 &/blocks.23/self_attn/Concat_9_output_0'/blocks.23/self_attn/Reshape_4_output_0/blocks.23/self_attn/Reshape_4"Reshape* allowzero w )/blocks.23/self_attn/Transpose_2_output_0%/blocks.23/self_attn/Shape_9_output_0/blocks.23/self_attn/Shape_9"Shape )/blocks.23/self_attn/Constant_43_output_0 /blocks.23/self_attn/Constant_43"Constant*F value*:B,/blocks.23/self_attn/Constant_43_attr::valueJ  %/blocks.23/self_attn/Shape_9_output_0 )/blocks.23/self_attn/Constant_43_output_0'/blocks.23/self_attn/Gather_10_output_0/blocks.23/self_attn/Gather_10"Gather* axis y )/blocks.23/self_attn/Transpose_2_output_0&/blocks.23/self_attn/Shape_10_output_0/blocks.23/self_attn/Shape_10"Shape )/blocks.23/self_attn/Constant_44_output_0 /blocks.23/self_attn/Constant_44"Constant*F value*:B,/blocks.23/self_attn/Constant_44_attr::valueJ  &/blocks.23/self_attn/Shape_10_output_0 )/blocks.23/self_attn/Constant_44_output_0'/blocks.23/self_attn/Gather_11_output_0/blocks.23/self_attn/Gather_11"Gather* axis y )/blocks.23/self_attn/Transpose_2_output_0&/blocks.23/self_attn/Shape_11_output_0/blocks.23/self_attn/Shape_11"Shape )/blocks.23/self_attn/Constant_45_output_0 /blocks.23/self_attn/Constant_45"Constant*F value*:B,/blocks.23/self_attn/Constant_45_attr::valueJ  &/blocks.23/self_attn/Shape_11_output_0 )/blocks.23/self_attn/Constant_45_output_0'/blocks.23/self_attn/Gather_12_output_0/blocks.23/self_attn/Gather_12"Gather* axis y )/blocks.23/self_attn/Transpose_2_output_0&/blocks.23/self_attn/Shape_12_output_0/blocks.23/self_attn/Shape_12"Shape )/blocks.23/self_attn/Constant_46_output_0 /blocks.23/self_attn/Constant_46"Constant*F value*:B,/blocks.23/self_attn/Constant_46_attr::valueJ  &/blocks.23/self_attn/Shape_12_output_0 )/blocks.23/self_attn/Constant_46_output_0'/blocks.23/self_attn/Gather_13_output_0/blocks.23/self_attn/Gather_13"Gather* axis )/blocks.23/self_attn/Constant_47_output_0 /blocks.23/self_attn/Constant_47"Constant*H value*<B,/blocks.23/self_attn/Constant_47_attr::valueJ  )/blocks.23/self_attn/Transpose_2_output_0 )/blocks.23/self_attn/Constant_47_output_0*/blocks.23/self_attn/Unsqueeze_21_output_0!/blocks.23/self_attn/Unsqueeze_21" Unsqueeze )/blocks.23/self_attn/Constant_48_output_0 /blocks.23/self_attn/Constant_48"Constant*H value*<B,/blocks.23/self_attn/Constant_48_attr::valueJ  '/blocks.23/self_attn/Gather_10_output_0 )/blocks.23/self_attn/Constant_48_output_0*/blocks.23/self_attn/Unsqueeze_22_output_0!/blocks.23/self_attn/Unsqueeze_22" Unsqueeze )/blocks.23/self_attn/Constant_49_output_0 /blocks.23/self_attn/Constant_49"Constant*H value*<B,/blocks.23/self_attn/Constant_49_attr::valueJ  '/blocks.23/self_attn/Gather_11_output_0 )/blocks.23/self_attn/Constant_49_output_0*/blocks.23/self_attn/Unsqueeze_23_output_0!/blocks.23/self_attn/Unsqueeze_23" Unsqueeze )/blocks.23/self_attn/Constant_50_output_0 /blocks.23/self_attn/Constant_50"Constant*H value*<B,/blocks.23/self_attn/Constant_50_attr::valueJ )/blocks.23/self_attn/Constant_51_output_0 /blocks.23/self_attn/Constant_51"Constant*H value*<B,/blocks.23/self_attn/Constant_51_attr::valueJ  '/blocks.23/self_attn/Gather_12_output_0 )/blocks.23/self_attn/Constant_51_output_0*/blocks.23/self_attn/Unsqueeze_24_output_0!/blocks.23/self_attn/Unsqueeze_24" Unsqueeze )/blocks.23/self_attn/Constant_52_output_0 /blocks.23/self_attn/Constant_52"Constant*H value*<B,/blocks.23/self_attn/Constant_52_attr::valueJ  '/blocks.23/self_attn/Gather_13_output_0 )/blocks.23/self_attn/Constant_52_output_0*/blocks.23/self_attn/Unsqueeze_25_output_0!/blocks.23/self_attn/Unsqueeze_25" Unsqueeze  */blocks.23/self_attn/Unsqueeze_22_output_0 */blocks.23/self_attn/Unsqueeze_23_output_0 )/blocks.23/self_attn/Constant_50_output_0 */blocks.23/self_attn/Unsqueeze_24_output_0 */blocks.23/self_attn/Unsqueeze_25_output_0'/blocks.23/self_attn/Concat_10_output_0/blocks.23/self_attn/Concat_10"Concat* axis )/blocks.23/self_attn/Constant_53_output_0 /blocks.23/self_attn/Constant_53"Constant*H value*<B,/blocks.23/self_attn/Constant_53_attr::valueJ  '/blocks.23/self_attn/Concat_10_output_0 )/blocks.23/self_attn/Constant_53_output_0'/blocks.23/self_attn/Reshape_5_output_0/blocks.23/self_attn/Reshape_5"Reshape* allowzero w '/blocks.23/self_attn/Reshape_5_output_0&/blocks.23/self_attn/Shape_13_output_0/blocks.23/self_attn/Shape_13"Shape  &/blocks.23/self_attn/Shape_13_output_0//blocks.23/self_attn/ConstantOfShape_1_output_0&/blocks.23/self_attn/ConstantOfShape_1"ConstantOfShape*N value*BB2/blocks.23/self_attn/ConstantOfShape_1_attr::valueJ )/blocks.23/self_attn/Constant_54_output_0 /blocks.23/self_attn/Constant_54"Constant*F value*:B,/blocks.23/self_attn/Constant_54_attr::valueJ  //blocks.23/self_attn/ConstantOfShape_1_output_0 )/blocks.23/self_attn/Constant_54_output_0#/blocks.23/self_attn/Mul_6_output_0/blocks.23/self_attn/Mul_6"Mul  '/blocks.23/self_attn/Reshape_5_output_0 #/blocks.23/self_attn/Mul_6_output_0%/blocks.23/self_attn/Equal_1_output_0/blocks.23/self_attn/Equal_1"Equal  %/blocks.23/self_attn/Equal_1_output_0 //blocks.23/self_attn/ConstantOfShape_1_output_0 '/blocks.23/self_attn/Reshape_5_output_0%/blocks.23/self_attn/Where_1_output_0/blocks.23/self_attn/Where_1"Where  */blocks.23/self_attn/Unsqueeze_21_output_0 %/blocks.23/self_attn/Where_1_output_0&/blocks.23/self_attn/Expand_1_output_0/blocks.23/self_attn/Expand_1"Expand )/blocks.23/self_attn/Constant_55_output_0 /blocks.23/self_attn/Constant_55"Constant*F value*:B,/blocks.23/self_attn/Constant_55_attr::valueJ  '/blocks.23/self_attn/Gather_11_output_0 )/blocks.23/self_attn/Constant_55_output_0#/blocks.23/self_attn/Mul_7_output_0/blocks.23/self_attn/Mul_7"Mul fonnx::Unsqueeze_7270 Constant_8788"Constant*5 value*)BConstant_8788_attr::valueJ  '/blocks.23/self_attn/Gather_10_output_0 onnx::Unsqueeze_7270*/blocks.23/self_attn/Unsqueeze_26_output_0!/blocks.23/self_attn/Unsqueeze_26" Unsqueeze fonnx::Unsqueeze_7272 Constant_8790"Constant*5 value*)BConstant_8790_attr::valueJ  #/blocks.23/self_attn/Mul_7_output_0 onnx::Unsqueeze_7272*/blocks.23/self_attn/Unsqueeze_27_output_0!/blocks.23/self_attn/Unsqueeze_27" Unsqueeze fonnx::Unsqueeze_7274 Constant_8792"Constant*5 value*)BConstant_8792_attr::valueJ  '/blocks.23/self_attn/Gather_12_output_0 onnx::Unsqueeze_7274*/blocks.23/self_attn/Unsqueeze_28_output_0!/blocks.23/self_attn/Unsqueeze_28" Unsqueeze fonnx::Unsqueeze_7276 Constant_8794"Constant*5 value*)BConstant_8794_attr::valueJ  '/blocks.23/self_attn/Gather_13_output_0 onnx::Unsqueeze_7276*/blocks.23/self_attn/Unsqueeze_29_output_0!/blocks.23/self_attn/Unsqueeze_29" Unsqueeze  */blocks.23/self_attn/Unsqueeze_26_output_0 */blocks.23/self_attn/Unsqueeze_27_output_0 */blocks.23/self_attn/Unsqueeze_28_output_0 */blocks.23/self_attn/Unsqueeze_29_output_0'/blocks.23/self_attn/Concat_11_output_0/blocks.23/self_attn/Concat_11"Concat* axis  &/blocks.23/self_attn/Expand_1_output_0 '/blocks.23/self_attn/Concat_11_output_0'/blocks.23/self_attn/Reshape_6_output_0/blocks.23/self_attn/Reshape_6"Reshape* allowzero  '/blocks.23/self_attn/Transpose_output_0 '/blocks.23/self_attn/Reshape_4_output_0$/blocks.23/self_attn/MatMul_output_0/blocks.23/self_attn/MatMul"MatMul )/blocks.23/self_attn/Constant_56_output_0 /blocks.23/self_attn/Constant_56"Constant*B value*6B,/blocks.23/self_attn/Constant_56_attr::valueJ5A  $/blocks.23/self_attn/MatMul_output_0 )/blocks.23/self_attn/Constant_56_output_0#/blocks.23/self_attn/Div_2_output_0/blocks.23/self_attn/Div_2"Div { #/blocks.23/self_attn/Div_2_output_0 attention_mask#/blocks.23/self_attn/Add_2_output_0/blocks.23/self_attn/Add_2"Add  #/blocks.23/self_attn/Add_2_output_0%/blocks.23/self_attn/Softmax_output_0/blocks.23/self_attn/Softmax"Softmax* axis { %/blocks.23/self_attn/Softmax_output_0$/blocks.23/self_attn/Cast_4_output_0/blocks.23/self_attn/Cast_4"Cast* to  $/blocks.23/self_attn/Cast_4_output_0 '/blocks.23/self_attn/Reshape_6_output_0&/blocks.23/self_attn/MatMul_1_output_0/blocks.23/self_attn/MatMul_1"MatMul  &/blocks.23/self_attn/MatMul_1_output_0)/blocks.23/self_attn/Transpose_3_output_0 /blocks.23/self_attn/Transpose_3" Transpose* perm@@@@ fonnx::Unsqueeze_7288 Constant_8806"Constant*5 value*)BConstant_8806_attr::valueJ  $/blocks.23/self_attn/Gather_output_0 onnx::Unsqueeze_7288*/blocks.23/self_attn/Unsqueeze_30_output_0!/blocks.23/self_attn/Unsqueeze_30" Unsqueeze fonnx::Unsqueeze_7290 Constant_8808"Constant*5 value*)BConstant_8808_attr::valueJ  &/blocks.23/self_attn/Gather_1_output_0 onnx::Unsqueeze_7290*/blocks.23/self_attn/Unsqueeze_31_output_0!/blocks.23/self_attn/Unsqueeze_31" Unsqueeze )/blocks.23/self_attn/Constant_57_output_0 /blocks.23/self_attn/Constant_57"Constant*H value*<B,/blocks.23/self_attn/Constant_57_attr::valueJ  */blocks.23/self_attn/Unsqueeze_30_output_0 */blocks.23/self_attn/Unsqueeze_31_output_0 )/blocks.23/self_attn/Constant_57_output_0'/blocks.23/self_attn/Concat_12_output_0/blocks.23/self_attn/Concat_12"Concat* axis  )/blocks.23/self_attn/Transpose_3_output_0 '/blocks.23/self_attn/Concat_12_output_0'/blocks.23/self_attn/Reshape_7_output_0/blocks.23/self_attn/Reshape_7"Reshape* allowzero  '/blocks.23/self_attn/Reshape_7_output_0 onnx::MatMul_9233+/blocks.23/self_attn/o_proj/MatMul_output_0"/blocks.23/self_attn/o_proj/MatMul"MatMul  */blocks.23/input_layernorm/Cast_1_output_0 +/blocks.23/self_attn/o_proj/MatMul_output_0/blocks.23/Add_output_0/blocks.23/Add"Add  /blocks.23/Add_output_01/blocks.23/post_attention_layernorm/Cast_output_0(/blocks.23/post_attention_layernorm/Cast"Cast* to 5/blocks.23/post_attention_layernorm/Constant_output_0,/blocks.23/post_attention_layernorm/Constant"Constant*N value*BB8/blocks.23/post_attention_layernorm/Constant_attr::valueJ@  1/blocks.23/post_attention_layernorm/Cast_output_0 5/blocks.23/post_attention_layernorm/Constant_output_00/blocks.23/post_attention_layernorm/Pow_output_0'/blocks.23/post_attention_layernorm/Pow"Pow  0/blocks.23/post_attention_layernorm/Pow_output_07/blocks.23/post_attention_layernorm/ReduceMean_output_0./blocks.23/post_attention_layernorm/ReduceMean" ReduceMean* axes@* keepdims 7/blocks.23/post_attention_layernorm/Constant_1_output_0./blocks.23/post_attention_layernorm/Constant_1"Constant*P value*DB:/blocks.23/post_attention_layernorm/Constant_1_attr::valueJ75  7/blocks.23/post_attention_layernorm/ReduceMean_output_0 7/blocks.23/post_attention_layernorm/Constant_1_output_00/blocks.23/post_attention_layernorm/Add_output_0'/blocks.23/post_attention_layernorm/Add"Add  0/blocks.23/post_attention_layernorm/Add_output_01/blocks.23/post_attention_layernorm/Sqrt_output_0(/blocks.23/post_attention_layernorm/Sqrt"Sqrt 7/blocks.23/post_attention_layernorm/Constant_2_output_0./blocks.23/post_attention_layernorm/Constant_2"Constant*P value*DB:/blocks.23/post_attention_layernorm/Constant_2_attr::valueJ?  7/blocks.23/post_attention_layernorm/Constant_2_output_0 1/blocks.23/post_attention_layernorm/Sqrt_output_00/blocks.23/post_attention_layernorm/Div_output_0'/blocks.23/post_attention_layernorm/Div"Div  1/blocks.23/post_attention_layernorm/Cast_output_03/blocks.23/post_attention_layernorm/Cast_1_output_0*/blocks.23/post_attention_layernorm/Cast_1"Cast* to  3/blocks.23/post_attention_layernorm/Cast_1_output_0 0/blocks.23/post_attention_layernorm/Div_output_00/blocks.23/post_attention_layernorm/Mul_output_0'/blocks.23/post_attention_layernorm/Mul"Mul  0/blocks.23/post_attention_layernorm/Mul_output_0 )blocks.23.post_attention_layernorm.weight2/blocks.23/post_attention_layernorm/Mul_1_output_0)/blocks.23/post_attention_layernorm/Mul_1"Mul  2/blocks.23/post_attention_layernorm/Mul_1_output_03/blocks.23/post_attention_layernorm/Cast_2_output_0*/blocks.23/post_attention_layernorm/Cast_2"Cast* to  3/blocks.23/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_9234(/blocks.23/mlp/gate_proj/MatMul_output_0/blocks.23/mlp/gate_proj/MatMul"MatMul z (/blocks.23/mlp/gate_proj/MatMul_output_0&/blocks.23/mlp/act_fn/Sigmoid_output_0/blocks.23/mlp/act_fn/Sigmoid"Sigmoid  (/blocks.23/mlp/gate_proj/MatMul_output_0 &/blocks.23/mlp/act_fn/Sigmoid_output_0"/blocks.23/mlp/act_fn/Mul_output_0/blocks.23/mlp/act_fn/Mul"Mul  3/blocks.23/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_9235&/blocks.23/mlp/up_proj/MatMul_output_0/blocks.23/mlp/up_proj/MatMul"MatMul  "/blocks.23/mlp/act_fn/Mul_output_0 &/blocks.23/mlp/up_proj/MatMul_output_0/blocks.23/mlp/Mul_output_0/blocks.23/mlp/Mul"Mul  /blocks.23/mlp/Mul_output_0 onnx::MatMul_9236(/blocks.23/mlp/down_proj/MatMul_output_0/blocks.23/mlp/down_proj/MatMul"MatMul  3/blocks.23/post_attention_layernorm/Cast_1_output_0 (/blocks.23/mlp/down_proj/MatMul_output_0/blocks.23/Add_1_output_0/blocks.23/Add_1"Add c/Constant_16_output_0 /Constant_16"Constant*2 value*&B/Constant_16_attr::valueJ ^ past_key_values /Constant_16_output_0/Gather_24_output_0 /Gather_24"Gather* axis /blocks.24/Constant_output_0/blocks.24/Constant"Constant*K value*?B/blocks.24/Constant_attr::valueJ  /blocks.23/Add_1_output_0 /blocks.24/Constant_output_0/blocks.24/Reshape_output_0/blocks.24/Reshape"Reshape* allowzero y /blocks.24/Reshape_output_0(/blocks.24/input_layernorm/Cast_output_0/blocks.24/input_layernorm/Cast"Cast* to ,/blocks.24/input_layernorm/Constant_output_0#/blocks.24/input_layernorm/Constant"Constant*E value*9B//blocks.24/input_layernorm/Constant_attr::valueJ@  (/blocks.24/input_layernorm/Cast_output_0 ,/blocks.24/input_layernorm/Constant_output_0'/blocks.24/input_layernorm/Pow_output_0/blocks.24/input_layernorm/Pow"Pow  '/blocks.24/input_layernorm/Pow_output_0./blocks.24/input_layernorm/ReduceMean_output_0%/blocks.24/input_layernorm/ReduceMean" ReduceMean* axes@* keepdims ./blocks.24/input_layernorm/Constant_1_output_0%/blocks.24/input_layernorm/Constant_1"Constant*G value*;B1/blocks.24/input_layernorm/Constant_1_attr::valueJ75  ./blocks.24/input_layernorm/ReduceMean_output_0 ./blocks.24/input_layernorm/Constant_1_output_0'/blocks.24/input_layernorm/Add_output_0/blocks.24/input_layernorm/Add"Add z '/blocks.24/input_layernorm/Add_output_0(/blocks.24/input_layernorm/Sqrt_output_0/blocks.24/input_layernorm/Sqrt"Sqrt ./blocks.24/input_layernorm/Constant_2_output_0%/blocks.24/input_layernorm/Constant_2"Constant*G value*;B1/blocks.24/input_layernorm/Constant_2_attr::valueJ?  ./blocks.24/input_layernorm/Constant_2_output_0 (/blocks.24/input_layernorm/Sqrt_output_0'/blocks.24/input_layernorm/Div_output_0/blocks.24/input_layernorm/Div"Div  (/blocks.24/input_layernorm/Cast_output_0*/blocks.24/input_layernorm/Cast_1_output_0!/blocks.24/input_layernorm/Cast_1"Cast* to  */blocks.24/input_layernorm/Cast_1_output_0 '/blocks.24/input_layernorm/Div_output_0'/blocks.24/input_layernorm/Mul_output_0/blocks.24/input_layernorm/Mul"Mul  '/blocks.24/input_layernorm/Mul_output_0 blocks.24.input_layernorm.weight)/blocks.24/input_layernorm/Mul_1_output_0 /blocks.24/input_layernorm/Mul_1"Mul  )/blocks.24/input_layernorm/Mul_1_output_0*/blocks.24/input_layernorm/Cast_2_output_0!/blocks.24/input_layernorm/Cast_2"Cast* to t */blocks.24/input_layernorm/Cast_2_output_0#/blocks.24/self_attn/Shape_output_0/blocks.24/self_attn/Shape"Shape &/blocks.24/self_attn/Constant_output_0/blocks.24/self_attn/Constant"Constant*C value*7B)/blocks.24/self_attn/Constant_attr::valueJ  #/blocks.24/self_attn/Shape_output_0 &/blocks.24/self_attn/Constant_output_0$/blocks.24/self_attn/Gather_output_0/blocks.24/self_attn/Gather"Gather* axis x */blocks.24/input_layernorm/Cast_2_output_0%/blocks.24/self_attn/Shape_1_output_0/blocks.24/self_attn/Shape_1"Shape (/blocks.24/self_attn/Constant_1_output_0/blocks.24/self_attn/Constant_1"Constant*E value*9B+/blocks.24/self_attn/Constant_1_attr::valueJ  %/blocks.24/self_attn/Shape_1_output_0 (/blocks.24/self_attn/Constant_1_output_0&/blocks.24/self_attn/Gather_1_output_0/blocks.24/self_attn/Gather_1"Gather* axis  */blocks.24/input_layernorm/Cast_2_output_0 onnx::MatMul_9237+/blocks.24/self_attn/q_proj/MatMul_output_0"/blocks.24/self_attn/q_proj/MatMul"MatMul  */blocks.24/input_layernorm/Cast_2_output_0 onnx::MatMul_9238+/blocks.24/self_attn/k_proj/MatMul_output_0"/blocks.24/self_attn/k_proj/MatMul"MatMul  */blocks.24/input_layernorm/Cast_2_output_0 onnx::MatMul_9239+/blocks.24/self_attn/v_proj/MatMul_output_0"/blocks.24/self_attn/v_proj/MatMul"MatMul fonnx::Unsqueeze_7351 Constant_8861"Constant*5 value*)BConstant_8861_attr::valueJ  $/blocks.24/self_attn/Gather_output_0 onnx::Unsqueeze_7351'/blocks.24/self_attn/Unsqueeze_output_0/blocks.24/self_attn/Unsqueeze" Unsqueeze fonnx::Unsqueeze_7353 Constant_8863"Constant*5 value*)BConstant_8863_attr::valueJ  &/blocks.24/self_attn/Gather_1_output_0 onnx::Unsqueeze_7353)/blocks.24/self_attn/Unsqueeze_1_output_0 /blocks.24/self_attn/Unsqueeze_1" Unsqueeze (/blocks.24/self_attn/Constant_2_output_0/blocks.24/self_attn/Constant_2"Constant*G value*;B+/blocks.24/self_attn/Constant_2_attr::valueJ (/blocks.24/self_attn/Constant_3_output_0/blocks.24/self_attn/Constant_3"Constant*G value*;B+/blocks.24/self_attn/Constant_3_attr::valueJ  '/blocks.24/self_attn/Unsqueeze_output_0 )/blocks.24/self_attn/Unsqueeze_1_output_0 (/blocks.24/self_attn/Constant_2_output_0 (/blocks.24/self_attn/Constant_3_output_0$/blocks.24/self_attn/Concat_output_0/blocks.24/self_attn/Concat"Concat* axis  +/blocks.24/self_attn/q_proj/MatMul_output_0 $/blocks.24/self_attn/Concat_output_0%/blocks.24/self_attn/Reshape_output_0/blocks.24/self_attn/Reshape"Reshape* allowzero fonnx::Unsqueeze_7361 Constant_8869"Constant*5 value*)BConstant_8869_attr::valueJ  $/blocks.24/self_attn/Gather_output_0 onnx::Unsqueeze_7361)/blocks.24/self_attn/Unsqueeze_2_output_0 /blocks.24/self_attn/Unsqueeze_2" Unsqueeze fonnx::Unsqueeze_7363 Constant_8871"Constant*5 value*)BConstant_8871_attr::valueJ  &/blocks.24/self_attn/Gather_1_output_0 onnx::Unsqueeze_7363)/blocks.24/self_attn/Unsqueeze_3_output_0 /blocks.24/self_attn/Unsqueeze_3" Unsqueeze (/blocks.24/self_attn/Constant_4_output_0/blocks.24/self_attn/Constant_4"Constant*G value*;B+/blocks.24/self_attn/Constant_4_attr::valueJ (/blocks.24/self_attn/Constant_5_output_0/blocks.24/self_attn/Constant_5"Constant*G value*;B+/blocks.24/self_attn/Constant_5_attr::valueJ  )/blocks.24/self_attn/Unsqueeze_2_output_0 )/blocks.24/self_attn/Unsqueeze_3_output_0 (/blocks.24/self_attn/Constant_4_output_0 (/blocks.24/self_attn/Constant_5_output_0&/blocks.24/self_attn/Concat_1_output_0/blocks.24/self_attn/Concat_1"Concat* axis fonnx::Unsqueeze_7370 Constant_8876"Constant*5 value*)BConstant_8876_attr::valueJ  $/blocks.24/self_attn/Gather_output_0 onnx::Unsqueeze_7370)/blocks.24/self_attn/Unsqueeze_4_output_0 /blocks.24/self_attn/Unsqueeze_4" Unsqueeze fonnx::Unsqueeze_7372 Constant_8878"Constant*5 value*)BConstant_8878_attr::valueJ  &/blocks.24/self_attn/Gather_1_output_0 onnx::Unsqueeze_7372)/blocks.24/self_attn/Unsqueeze_5_output_0 /blocks.24/self_attn/Unsqueeze_5" Unsqueeze (/blocks.24/self_attn/Constant_6_output_0/blocks.24/self_attn/Constant_6"Constant*G value*;B+/blocks.24/self_attn/Constant_6_attr::valueJ (/blocks.24/self_attn/Constant_7_output_0/blocks.24/self_attn/Constant_7"Constant*G value*;B+/blocks.24/self_attn/Constant_7_attr::valueJ  )/blocks.24/self_attn/Unsqueeze_4_output_0 )/blocks.24/self_attn/Unsqueeze_5_output_0 (/blocks.24/self_attn/Constant_6_output_0 (/blocks.24/self_attn/Constant_7_output_0&/blocks.24/self_attn/Concat_2_output_0/blocks.24/self_attn/Concat_2"Concat* axis  +/blocks.24/self_attn/k_proj/MatMul_output_0 &/blocks.24/self_attn/Concat_1_output_0'/blocks.24/self_attn/Reshape_1_output_0/blocks.24/self_attn/Reshape_1"Reshape* allowzero  +/blocks.24/self_attn/v_proj/MatMul_output_0 &/blocks.24/self_attn/Concat_2_output_0'/blocks.24/self_attn/Reshape_2_output_0/blocks.24/self_attn/Reshape_2"Reshape* allowzero  %/blocks.24/self_attn/Reshape_output_0)/blocks.24/self_attn/q_norm/Cast_output_0 /blocks.24/self_attn/q_norm/Cast"Cast* to -/blocks.24/self_attn/q_norm/Constant_output_0$/blocks.24/self_attn/q_norm/Constant"Constant*F value*:B0/blocks.24/self_attn/q_norm/Constant_attr::valueJ@  )/blocks.24/self_attn/q_norm/Cast_output_0 -/blocks.24/self_attn/q_norm/Constant_output_0(/blocks.24/self_attn/q_norm/Pow_output_0/blocks.24/self_attn/q_norm/Pow"Pow  (/blocks.24/self_attn/q_norm/Pow_output_0//blocks.24/self_attn/q_norm/ReduceMean_output_0&/blocks.24/self_attn/q_norm/ReduceMean" ReduceMean* axes@* keepdims //blocks.24/self_attn/q_norm/Constant_1_output_0&/blocks.24/self_attn/q_norm/Constant_1"Constant*H value*<B2/blocks.24/self_attn/q_norm/Constant_1_attr::valueJ75  //blocks.24/self_attn/q_norm/ReduceMean_output_0 //blocks.24/self_attn/q_norm/Constant_1_output_0(/blocks.24/self_attn/q_norm/Add_output_0/blocks.24/self_attn/q_norm/Add"Add } (/blocks.24/self_attn/q_norm/Add_output_0)/blocks.24/self_attn/q_norm/Sqrt_output_0 /blocks.24/self_attn/q_norm/Sqrt"Sqrt //blocks.24/self_attn/q_norm/Constant_2_output_0&/blocks.24/self_attn/q_norm/Constant_2"Constant*H value*<B2/blocks.24/self_attn/q_norm/Constant_2_attr::valueJ?  //blocks.24/self_attn/q_norm/Constant_2_output_0 )/blocks.24/self_attn/q_norm/Sqrt_output_0(/blocks.24/self_attn/q_norm/Div_output_0/blocks.24/self_attn/q_norm/Div"Div  )/blocks.24/self_attn/q_norm/Cast_output_0+/blocks.24/self_attn/q_norm/Cast_1_output_0"/blocks.24/self_attn/q_norm/Cast_1"Cast* to  +/blocks.24/self_attn/q_norm/Cast_1_output_0 (/blocks.24/self_attn/q_norm/Div_output_0(/blocks.24/self_attn/q_norm/Mul_output_0/blocks.24/self_attn/q_norm/Mul"Mul  (/blocks.24/self_attn/q_norm/Mul_output_0 !blocks.24.self_attn.q_norm.weight*/blocks.24/self_attn/q_norm/Mul_1_output_0!/blocks.24/self_attn/q_norm/Mul_1"Mul  */blocks.24/self_attn/q_norm/Mul_1_output_0+/blocks.24/self_attn/q_norm/Cast_2_output_0"/blocks.24/self_attn/q_norm/Cast_2"Cast* to  '/blocks.24/self_attn/Reshape_1_output_0)/blocks.24/self_attn/k_norm/Cast_output_0 /blocks.24/self_attn/k_norm/Cast"Cast* to -/blocks.24/self_attn/k_norm/Constant_output_0$/blocks.24/self_attn/k_norm/Constant"Constant*F value*:B0/blocks.24/self_attn/k_norm/Constant_attr::valueJ@  )/blocks.24/self_attn/k_norm/Cast_output_0 -/blocks.24/self_attn/k_norm/Constant_output_0(/blocks.24/self_attn/k_norm/Pow_output_0/blocks.24/self_attn/k_norm/Pow"Pow  (/blocks.24/self_attn/k_norm/Pow_output_0//blocks.24/self_attn/k_norm/ReduceMean_output_0&/blocks.24/self_attn/k_norm/ReduceMean" ReduceMean* axes@* keepdims //blocks.24/self_attn/k_norm/Constant_1_output_0&/blocks.24/self_attn/k_norm/Constant_1"Constant*H value*<B2/blocks.24/self_attn/k_norm/Constant_1_attr::valueJ75  //blocks.24/self_attn/k_norm/ReduceMean_output_0 //blocks.24/self_attn/k_norm/Constant_1_output_0(/blocks.24/self_attn/k_norm/Add_output_0/blocks.24/self_attn/k_norm/Add"Add } (/blocks.24/self_attn/k_norm/Add_output_0)/blocks.24/self_attn/k_norm/Sqrt_output_0 /blocks.24/self_attn/k_norm/Sqrt"Sqrt //blocks.24/self_attn/k_norm/Constant_2_output_0&/blocks.24/self_attn/k_norm/Constant_2"Constant*H value*<B2/blocks.24/self_attn/k_norm/Constant_2_attr::valueJ?  //blocks.24/self_attn/k_norm/Constant_2_output_0 )/blocks.24/self_attn/k_norm/Sqrt_output_0(/blocks.24/self_attn/k_norm/Div_output_0/blocks.24/self_attn/k_norm/Div"Div  )/blocks.24/self_attn/k_norm/Cast_output_0+/blocks.24/self_attn/k_norm/Cast_1_output_0"/blocks.24/self_attn/k_norm/Cast_1"Cast* to  +/blocks.24/self_attn/k_norm/Cast_1_output_0 (/blocks.24/self_attn/k_norm/Div_output_0(/blocks.24/self_attn/k_norm/Mul_output_0/blocks.24/self_attn/k_norm/Mul"Mul  (/blocks.24/self_attn/k_norm/Mul_output_0 !blocks.24.self_attn.k_norm.weight*/blocks.24/self_attn/k_norm/Mul_1_output_0!/blocks.24/self_attn/k_norm/Mul_1"Mul  */blocks.24/self_attn/k_norm/Mul_1_output_0+/blocks.24/self_attn/k_norm/Cast_2_output_0"/blocks.24/self_attn/k_norm/Cast_2"Cast* to  +/blocks.24/self_attn/q_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0!/blocks.24/self_attn/Mul_output_0/blocks.24/self_attn/Mul"Mul y +/blocks.24/self_attn/q_norm/Cast_2_output_0%/blocks.24/self_attn/Shape_2_output_0/blocks.24/self_attn/Shape_2"Shape (/blocks.24/self_attn/Constant_8_output_0/blocks.24/self_attn/Constant_8"Constant*E value*9B+/blocks.24/self_attn/Constant_8_attr::valueJ  %/blocks.24/self_attn/Shape_2_output_0 (/blocks.24/self_attn/Constant_8_output_0&/blocks.24/self_attn/Gather_2_output_0/blocks.24/self_attn/Gather_2"Gather* axis (/blocks.24/self_attn/Constant_9_output_0/blocks.24/self_attn/Constant_9"Constant*E value*9B+/blocks.24/self_attn/Constant_9_attr::valueJ  &/blocks.24/self_attn/Gather_2_output_0 (/blocks.24/self_attn/Constant_9_output_0!/blocks.24/self_attn/Div_output_0/blocks.24/self_attn/Div"Div s !/blocks.24/self_attn/Div_output_0"/blocks.24/self_attn/Cast_output_0/blocks.24/self_attn/Cast"Cast* to x "/blocks.24/self_attn/Cast_output_0$/blocks.24/self_attn/Cast_1_output_0/blocks.24/self_attn/Cast_1"Cast* to )/blocks.24/self_attn/Constant_10_output_0 /blocks.24/self_attn/Constant_10"Constant*H value*<B,/blocks.24/self_attn/Constant_10_attr::valueJ )/blocks.24/self_attn/Constant_11_output_0 /blocks.24/self_attn/Constant_11"Constant*H value*<B,/blocks.24/self_attn/Constant_11_attr::valueJ )/blocks.24/self_attn/Constant_12_output_0 /blocks.24/self_attn/Constant_12"Constant*H value*<B,/blocks.24/self_attn/Constant_12_attr::valueJ  $/blocks.24/self_attn/Cast_1_output_0 )/blocks.24/self_attn/Constant_12_output_0)/blocks.24/self_attn/Unsqueeze_6_output_0 /blocks.24/self_attn/Unsqueeze_6" Unsqueeze )/blocks.24/self_attn/Constant_13_output_0 /blocks.24/self_attn/Constant_13"Constant*H value*<B,/blocks.24/self_attn/Constant_13_attr::valueJ  +/blocks.24/self_attn/q_norm/Cast_2_output_0 )/blocks.24/self_attn/Constant_11_output_0 )/blocks.24/self_attn/Unsqueeze_6_output_0 )/blocks.24/self_attn/Constant_10_output_0 )/blocks.24/self_attn/Constant_13_output_0#/blocks.24/self_attn/Slice_output_0/blocks.24/self_attn/Slice"Slice )/blocks.24/self_attn/Constant_14_output_0 /blocks.24/self_attn/Constant_14"Constant*H value*<B,/blocks.24/self_attn/Constant_14_attr::valueJ )/blocks.24/self_attn/Constant_15_output_0 /blocks.24/self_attn/Constant_15"Constant*H value*<B,/blocks.24/self_attn/Constant_15_attr::valueJ  $/blocks.24/self_attn/Cast_1_output_0 )/blocks.24/self_attn/Constant_15_output_0)/blocks.24/self_attn/Unsqueeze_7_output_0 /blocks.24/self_attn/Unsqueeze_7" Unsqueeze )/blocks.24/self_attn/Constant_16_output_0 /blocks.24/self_attn/Constant_16"Constant*H value*<B,/blocks.24/self_attn/Constant_16_attr::valueJ )/blocks.24/self_attn/Constant_17_output_0 /blocks.24/self_attn/Constant_17"Constant*H value*<B,/blocks.24/self_attn/Constant_17_attr::valueJ  +/blocks.24/self_attn/q_norm/Cast_2_output_0 )/blocks.24/self_attn/Unsqueeze_7_output_0 )/blocks.24/self_attn/Constant_16_output_0 )/blocks.24/self_attn/Constant_14_output_0 )/blocks.24/self_attn/Constant_17_output_0%/blocks.24/self_attn/Slice_1_output_0/blocks.24/self_attn/Slice_1"Slice i %/blocks.24/self_attn/Slice_1_output_0!/blocks.24/self_attn/Neg_output_0/blocks.24/self_attn/Neg"Neg  !/blocks.24/self_attn/Neg_output_0 #/blocks.24/self_attn/Slice_output_0&/blocks.24/self_attn/Concat_3_output_0/blocks.24/self_attn/Concat_3"Concat* axis  &/blocks.24/self_attn/Concat_3_output_0 %/blocks.0/self_attn/Gather_3_output_0#/blocks.24/self_attn/Mul_1_output_0/blocks.24/self_attn/Mul_1"Mul  !/blocks.24/self_attn/Mul_output_0 #/blocks.24/self_attn/Mul_1_output_0!/blocks.24/self_attn/Add_output_0/blocks.24/self_attn/Add"Add  +/blocks.24/self_attn/k_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0#/blocks.24/self_attn/Mul_2_output_0/blocks.24/self_attn/Mul_2"Mul y +/blocks.24/self_attn/k_norm/Cast_2_output_0%/blocks.24/self_attn/Shape_3_output_0/blocks.24/self_attn/Shape_3"Shape )/blocks.24/self_attn/Constant_18_output_0 /blocks.24/self_attn/Constant_18"Constant*F value*:B,/blocks.24/self_attn/Constant_18_attr::valueJ  %/blocks.24/self_attn/Shape_3_output_0 )/blocks.24/self_attn/Constant_18_output_0&/blocks.24/self_attn/Gather_3_output_0/blocks.24/self_attn/Gather_3"Gather* axis )/blocks.24/self_attn/Constant_19_output_0 /blocks.24/self_attn/Constant_19"Constant*F value*:B,/blocks.24/self_attn/Constant_19_attr::valueJ  &/blocks.24/self_attn/Gather_3_output_0 )/blocks.24/self_attn/Constant_19_output_0#/blocks.24/self_attn/Div_1_output_0/blocks.24/self_attn/Div_1"Div y #/blocks.24/self_attn/Div_1_output_0$/blocks.24/self_attn/Cast_2_output_0/blocks.24/self_attn/Cast_2"Cast* to z $/blocks.24/self_attn/Cast_2_output_0$/blocks.24/self_attn/Cast_3_output_0/blocks.24/self_attn/Cast_3"Cast* to )/blocks.24/self_attn/Constant_20_output_0 /blocks.24/self_attn/Constant_20"Constant*H value*<B,/blocks.24/self_attn/Constant_20_attr::valueJ )/blocks.24/self_attn/Constant_21_output_0 /blocks.24/self_attn/Constant_21"Constant*H value*<B,/blocks.24/self_attn/Constant_21_attr::valueJ )/blocks.24/self_attn/Constant_22_output_0 /blocks.24/self_attn/Constant_22"Constant*H value*<B,/blocks.24/self_attn/Constant_22_attr::valueJ  $/blocks.24/self_attn/Cast_3_output_0 )/blocks.24/self_attn/Constant_22_output_0)/blocks.24/self_attn/Unsqueeze_8_output_0 /blocks.24/self_attn/Unsqueeze_8" Unsqueeze )/blocks.24/self_attn/Constant_23_output_0 /blocks.24/self_attn/Constant_23"Constant*H value*<B,/blocks.24/self_attn/Constant_23_attr::valueJ  +/blocks.24/self_attn/k_norm/Cast_2_output_0 )/blocks.24/self_attn/Constant_21_output_0 )/blocks.24/self_attn/Unsqueeze_8_output_0 )/blocks.24/self_attn/Constant_20_output_0 )/blocks.24/self_attn/Constant_23_output_0%/blocks.24/self_attn/Slice_2_output_0/blocks.24/self_attn/Slice_2"Slice )/blocks.24/self_attn/Constant_24_output_0 /blocks.24/self_attn/Constant_24"Constant*H value*<B,/blocks.24/self_attn/Constant_24_attr::valueJ )/blocks.24/self_attn/Constant_25_output_0 /blocks.24/self_attn/Constant_25"Constant*H value*<B,/blocks.24/self_attn/Constant_25_attr::valueJ  $/blocks.24/self_attn/Cast_3_output_0 )/blocks.24/self_attn/Constant_25_output_0)/blocks.24/self_attn/Unsqueeze_9_output_0 /blocks.24/self_attn/Unsqueeze_9" Unsqueeze )/blocks.24/self_attn/Constant_26_output_0 /blocks.24/self_attn/Constant_26"Constant*H value*<B,/blocks.24/self_attn/Constant_26_attr::valueJ )/blocks.24/self_attn/Constant_27_output_0 /blocks.24/self_attn/Constant_27"Constant*H value*<B,/blocks.24/self_attn/Constant_27_attr::valueJ  +/blocks.24/self_attn/k_norm/Cast_2_output_0 )/blocks.24/self_attn/Unsqueeze_9_output_0 )/blocks.24/self_attn/Constant_26_output_0 )/blocks.24/self_attn/Constant_24_output_0 )/blocks.24/self_attn/Constant_27_output_0%/blocks.24/self_attn/Slice_3_output_0/blocks.24/self_attn/Slice_3"Slice m %/blocks.24/self_attn/Slice_3_output_0#/blocks.24/self_attn/Neg_1_output_0/blocks.24/self_attn/Neg_1"Neg  #/blocks.24/self_attn/Neg_1_output_0 %/blocks.24/self_attn/Slice_2_output_0&/blocks.24/self_attn/Concat_4_output_0/blocks.24/self_attn/Concat_4"Concat* axis  &/blocks.24/self_attn/Concat_4_output_0 %/blocks.0/self_attn/Gather_3_output_0#/blocks.24/self_attn/Mul_3_output_0/blocks.24/self_attn/Mul_3"Mul  #/blocks.24/self_attn/Mul_2_output_0 #/blocks.24/self_attn/Mul_3_output_0#/blocks.24/self_attn/Add_1_output_0/blocks.24/self_attn/Add_1"Add  /Gather_24_output_0 /rotary/Constant_3_output_0&/blocks.24/self_attn/Gather_4_output_0/blocks.24/self_attn/Gather_4"Gather* axis  /Gather_24_output_0 /rotary/Constant_8_output_0&/blocks.24/self_attn/Gather_5_output_0/blocks.24/self_attn/Gather_5"Gather* axis  &/blocks.24/self_attn/Gather_4_output_0 #/blocks.24/self_attn/Add_1_output_0&/blocks.24/self_attn/Concat_5_output_0/blocks.24/self_attn/Concat_5"Concat* axis  &/blocks.24/self_attn/Gather_5_output_0 '/blocks.24/self_attn/Reshape_2_output_0&/blocks.24/self_attn/Concat_6_output_0/blocks.24/self_attn/Concat_6"Concat* axis )/blocks.24/self_attn/Constant_28_output_0 /blocks.24/self_attn/Constant_28"Constant*H value*<B,/blocks.24/self_attn/Constant_28_attr::valueJ  &/blocks.24/self_attn/Concat_5_output_0 )/blocks.24/self_attn/Constant_28_output_0*/blocks.24/self_attn/Unsqueeze_10_output_0!/blocks.24/self_attn/Unsqueeze_10" Unsqueeze )/blocks.24/self_attn/Constant_29_output_0 /blocks.24/self_attn/Constant_29"Constant*H value*<B,/blocks.24/self_attn/Constant_29_attr::valueJ  &/blocks.24/self_attn/Concat_6_output_0 )/blocks.24/self_attn/Constant_29_output_0*/blocks.24/self_attn/Unsqueeze_11_output_0!/blocks.24/self_attn/Unsqueeze_11" Unsqueeze  */blocks.24/self_attn/Unsqueeze_10_output_0 */blocks.24/self_attn/Unsqueeze_11_output_0&/blocks.24/self_attn/Concat_7_output_0/blocks.24/self_attn/Concat_7"Concat* axis  !/blocks.24/self_attn/Add_output_0'/blocks.24/self_attn/Transpose_output_0/blocks.24/self_attn/Transpose" Transpose* perm@@@@  &/blocks.24/self_attn/Concat_5_output_0)/blocks.24/self_attn/Transpose_1_output_0 /blocks.24/self_attn/Transpose_1" Transpose* perm@@@@  &/blocks.24/self_attn/Concat_6_output_0)/blocks.24/self_attn/Transpose_2_output_0 /blocks.24/self_attn/Transpose_2" Transpose* perm@@@@ w )/blocks.24/self_attn/Transpose_1_output_0%/blocks.24/self_attn/Shape_4_output_0/blocks.24/self_attn/Shape_4"Shape )/blocks.24/self_attn/Constant_30_output_0 /blocks.24/self_attn/Constant_30"Constant*F value*:B,/blocks.24/self_attn/Constant_30_attr::valueJ  %/blocks.24/self_attn/Shape_4_output_0 )/blocks.24/self_attn/Constant_30_output_0&/blocks.24/self_attn/Gather_6_output_0/blocks.24/self_attn/Gather_6"Gather* axis w )/blocks.24/self_attn/Transpose_1_output_0%/blocks.24/self_attn/Shape_5_output_0/blocks.24/self_attn/Shape_5"Shape )/blocks.24/self_attn/Constant_31_output_0 /blocks.24/self_attn/Constant_31"Constant*F value*:B,/blocks.24/self_attn/Constant_31_attr::valueJ  %/blocks.24/self_attn/Shape_5_output_0 )/blocks.24/self_attn/Constant_31_output_0&/blocks.24/self_attn/Gather_7_output_0/blocks.24/self_attn/Gather_7"Gather* axis w )/blocks.24/self_attn/Transpose_1_output_0%/blocks.24/self_attn/Shape_6_output_0/blocks.24/self_attn/Shape_6"Shape )/blocks.24/self_attn/Constant_32_output_0 /blocks.24/self_attn/Constant_32"Constant*F value*:B,/blocks.24/self_attn/Constant_32_attr::valueJ  %/blocks.24/self_attn/Shape_6_output_0 )/blocks.24/self_attn/Constant_32_output_0&/blocks.24/self_attn/Gather_8_output_0/blocks.24/self_attn/Gather_8"Gather* axis w )/blocks.24/self_attn/Transpose_1_output_0%/blocks.24/self_attn/Shape_7_output_0/blocks.24/self_attn/Shape_7"Shape )/blocks.24/self_attn/Constant_33_output_0 /blocks.24/self_attn/Constant_33"Constant*F value*:B,/blocks.24/self_attn/Constant_33_attr::valueJ  %/blocks.24/self_attn/Shape_7_output_0 )/blocks.24/self_attn/Constant_33_output_0&/blocks.24/self_attn/Gather_9_output_0/blocks.24/self_attn/Gather_9"Gather* axis )/blocks.24/self_attn/Constant_34_output_0 /blocks.24/self_attn/Constant_34"Constant*H value*<B,/blocks.24/self_attn/Constant_34_attr::valueJ  )/blocks.24/self_attn/Transpose_1_output_0 )/blocks.24/self_attn/Constant_34_output_0*/blocks.24/self_attn/Unsqueeze_12_output_0!/blocks.24/self_attn/Unsqueeze_12" Unsqueeze )/blocks.24/self_attn/Constant_35_output_0 /blocks.24/self_attn/Constant_35"Constant*H value*<B,/blocks.24/self_attn/Constant_35_attr::valueJ  &/blocks.24/self_attn/Gather_6_output_0 )/blocks.24/self_attn/Constant_35_output_0*/blocks.24/self_attn/Unsqueeze_13_output_0!/blocks.24/self_attn/Unsqueeze_13" Unsqueeze )/blocks.24/self_attn/Constant_36_output_0 /blocks.24/self_attn/Constant_36"Constant*H value*<B,/blocks.24/self_attn/Constant_36_attr::valueJ  &/blocks.24/self_attn/Gather_7_output_0 )/blocks.24/self_attn/Constant_36_output_0*/blocks.24/self_attn/Unsqueeze_14_output_0!/blocks.24/self_attn/Unsqueeze_14" Unsqueeze )/blocks.24/self_attn/Constant_37_output_0 /blocks.24/self_attn/Constant_37"Constant*H value*<B,/blocks.24/self_attn/Constant_37_attr::valueJ )/blocks.24/self_attn/Constant_38_output_0 /blocks.24/self_attn/Constant_38"Constant*H value*<B,/blocks.24/self_attn/Constant_38_attr::valueJ  &/blocks.24/self_attn/Gather_8_output_0 )/blocks.24/self_attn/Constant_38_output_0*/blocks.24/self_attn/Unsqueeze_15_output_0!/blocks.24/self_attn/Unsqueeze_15" Unsqueeze )/blocks.24/self_attn/Constant_39_output_0 /blocks.24/self_attn/Constant_39"Constant*H value*<B,/blocks.24/self_attn/Constant_39_attr::valueJ  &/blocks.24/self_attn/Gather_9_output_0 )/blocks.24/self_attn/Constant_39_output_0*/blocks.24/self_attn/Unsqueeze_16_output_0!/blocks.24/self_attn/Unsqueeze_16" Unsqueeze  */blocks.24/self_attn/Unsqueeze_13_output_0 */blocks.24/self_attn/Unsqueeze_14_output_0 )/blocks.24/self_attn/Constant_37_output_0 */blocks.24/self_attn/Unsqueeze_15_output_0 */blocks.24/self_attn/Unsqueeze_16_output_0&/blocks.24/self_attn/Concat_8_output_0/blocks.24/self_attn/Concat_8"Concat* axis )/blocks.24/self_attn/Constant_40_output_0 /blocks.24/self_attn/Constant_40"Constant*H value*<B,/blocks.24/self_attn/Constant_40_attr::valueJ  &/blocks.24/self_attn/Concat_8_output_0 )/blocks.24/self_attn/Constant_40_output_0'/blocks.24/self_attn/Reshape_3_output_0/blocks.24/self_attn/Reshape_3"Reshape* allowzero u '/blocks.24/self_attn/Reshape_3_output_0%/blocks.24/self_attn/Shape_8_output_0/blocks.24/self_attn/Shape_8"Shape  %/blocks.24/self_attn/Shape_8_output_0-/blocks.24/self_attn/ConstantOfShape_output_0$/blocks.24/self_attn/ConstantOfShape"ConstantOfShape*L value*@B0/blocks.24/self_attn/ConstantOfShape_attr::valueJ )/blocks.24/self_attn/Constant_41_output_0 /blocks.24/self_attn/Constant_41"Constant*F value*:B,/blocks.24/self_attn/Constant_41_attr::valueJ  -/blocks.24/self_attn/ConstantOfShape_output_0 )/blocks.24/self_attn/Constant_41_output_0#/blocks.24/self_attn/Mul_4_output_0/blocks.24/self_attn/Mul_4"Mul  '/blocks.24/self_attn/Reshape_3_output_0 #/blocks.24/self_attn/Mul_4_output_0#/blocks.24/self_attn/Equal_output_0/blocks.24/self_attn/Equal"Equal  #/blocks.24/self_attn/Equal_output_0 -/blocks.24/self_attn/ConstantOfShape_output_0 '/blocks.24/self_attn/Reshape_3_output_0#/blocks.24/self_attn/Where_output_0/blocks.24/self_attn/Where"Where  */blocks.24/self_attn/Unsqueeze_12_output_0 #/blocks.24/self_attn/Where_output_0$/blocks.24/self_attn/Expand_output_0/blocks.24/self_attn/Expand"Expand )/blocks.24/self_attn/Constant_42_output_0 /blocks.24/self_attn/Constant_42"Constant*F value*:B,/blocks.24/self_attn/Constant_42_attr::valueJ  &/blocks.24/self_attn/Gather_7_output_0 )/blocks.24/self_attn/Constant_42_output_0#/blocks.24/self_attn/Mul_5_output_0/blocks.24/self_attn/Mul_5"Mul fonnx::Unsqueeze_7515 Constant_9006"Constant*5 value*)BConstant_9006_attr::valueJ  &/blocks.24/self_attn/Gather_6_output_0 onnx::Unsqueeze_7515*/blocks.24/self_attn/Unsqueeze_17_output_0!/blocks.24/self_attn/Unsqueeze_17" Unsqueeze fonnx::Unsqueeze_7517 Constant_9008"Constant*5 value*)BConstant_9008_attr::valueJ  #/blocks.24/self_attn/Mul_5_output_0 onnx::Unsqueeze_7517*/blocks.24/self_attn/Unsqueeze_18_output_0!/blocks.24/self_attn/Unsqueeze_18" Unsqueeze fonnx::Unsqueeze_7519 Constant_9010"Constant*5 value*)BConstant_9010_attr::valueJ  &/blocks.24/self_attn/Gather_8_output_0 onnx::Unsqueeze_7519*/blocks.24/self_attn/Unsqueeze_19_output_0!/blocks.24/self_attn/Unsqueeze_19" Unsqueeze fonnx::Unsqueeze_7521 Constant_9012"Constant*5 value*)BConstant_9012_attr::valueJ  &/blocks.24/self_attn/Gather_9_output_0 onnx::Unsqueeze_7521*/blocks.24/self_attn/Unsqueeze_20_output_0!/blocks.24/self_attn/Unsqueeze_20" Unsqueeze  */blocks.24/self_attn/Unsqueeze_17_output_0 */blocks.24/self_attn/Unsqueeze_18_output_0 */blocks.24/self_attn/Unsqueeze_19_output_0 */blocks.24/self_attn/Unsqueeze_20_output_0&/blocks.24/self_attn/Concat_9_output_0/blocks.24/self_attn/Concat_9"Concat* axis  $/blocks.24/self_attn/Expand_output_0 &/blocks.24/self_attn/Concat_9_output_0'/blocks.24/self_attn/Reshape_4_output_0/blocks.24/self_attn/Reshape_4"Reshape* allowzero w )/blocks.24/self_attn/Transpose_2_output_0%/blocks.24/self_attn/Shape_9_output_0/blocks.24/self_attn/Shape_9"Shape )/blocks.24/self_attn/Constant_43_output_0 /blocks.24/self_attn/Constant_43"Constant*F value*:B,/blocks.24/self_attn/Constant_43_attr::valueJ  %/blocks.24/self_attn/Shape_9_output_0 )/blocks.24/self_attn/Constant_43_output_0'/blocks.24/self_attn/Gather_10_output_0/blocks.24/self_attn/Gather_10"Gather* axis y )/blocks.24/self_attn/Transpose_2_output_0&/blocks.24/self_attn/Shape_10_output_0/blocks.24/self_attn/Shape_10"Shape )/blocks.24/self_attn/Constant_44_output_0 /blocks.24/self_attn/Constant_44"Constant*F value*:B,/blocks.24/self_attn/Constant_44_attr::valueJ  &/blocks.24/self_attn/Shape_10_output_0 )/blocks.24/self_attn/Constant_44_output_0'/blocks.24/self_attn/Gather_11_output_0/blocks.24/self_attn/Gather_11"Gather* axis y )/blocks.24/self_attn/Transpose_2_output_0&/blocks.24/self_attn/Shape_11_output_0/blocks.24/self_attn/Shape_11"Shape )/blocks.24/self_attn/Constant_45_output_0 /blocks.24/self_attn/Constant_45"Constant*F value*:B,/blocks.24/self_attn/Constant_45_attr::valueJ  &/blocks.24/self_attn/Shape_11_output_0 )/blocks.24/self_attn/Constant_45_output_0'/blocks.24/self_attn/Gather_12_output_0/blocks.24/self_attn/Gather_12"Gather* axis y )/blocks.24/self_attn/Transpose_2_output_0&/blocks.24/self_attn/Shape_12_output_0/blocks.24/self_attn/Shape_12"Shape )/blocks.24/self_attn/Constant_46_output_0 /blocks.24/self_attn/Constant_46"Constant*F value*:B,/blocks.24/self_attn/Constant_46_attr::valueJ  &/blocks.24/self_attn/Shape_12_output_0 )/blocks.24/self_attn/Constant_46_output_0'/blocks.24/self_attn/Gather_13_output_0/blocks.24/self_attn/Gather_13"Gather* axis )/blocks.24/self_attn/Constant_47_output_0 /blocks.24/self_attn/Constant_47"Constant*H value*<B,/blocks.24/self_attn/Constant_47_attr::valueJ  )/blocks.24/self_attn/Transpose_2_output_0 )/blocks.24/self_attn/Constant_47_output_0*/blocks.24/self_attn/Unsqueeze_21_output_0!/blocks.24/self_attn/Unsqueeze_21" Unsqueeze )/blocks.24/self_attn/Constant_48_output_0 /blocks.24/self_attn/Constant_48"Constant*H value*<B,/blocks.24/self_attn/Constant_48_attr::valueJ  '/blocks.24/self_attn/Gather_10_output_0 )/blocks.24/self_attn/Constant_48_output_0*/blocks.24/self_attn/Unsqueeze_22_output_0!/blocks.24/self_attn/Unsqueeze_22" Unsqueeze )/blocks.24/self_attn/Constant_49_output_0 /blocks.24/self_attn/Constant_49"Constant*H value*<B,/blocks.24/self_attn/Constant_49_attr::valueJ  '/blocks.24/self_attn/Gather_11_output_0 )/blocks.24/self_attn/Constant_49_output_0*/blocks.24/self_attn/Unsqueeze_23_output_0!/blocks.24/self_attn/Unsqueeze_23" Unsqueeze )/blocks.24/self_attn/Constant_50_output_0 /blocks.24/self_attn/Constant_50"Constant*H value*<B,/blocks.24/self_attn/Constant_50_attr::valueJ )/blocks.24/self_attn/Constant_51_output_0 /blocks.24/self_attn/Constant_51"Constant*H value*<B,/blocks.24/self_attn/Constant_51_attr::valueJ  '/blocks.24/self_attn/Gather_12_output_0 )/blocks.24/self_attn/Constant_51_output_0*/blocks.24/self_attn/Unsqueeze_24_output_0!/blocks.24/self_attn/Unsqueeze_24" Unsqueeze )/blocks.24/self_attn/Constant_52_output_0 /blocks.24/self_attn/Constant_52"Constant*H value*<B,/blocks.24/self_attn/Constant_52_attr::valueJ  '/blocks.24/self_attn/Gather_13_output_0 )/blocks.24/self_attn/Constant_52_output_0*/blocks.24/self_attn/Unsqueeze_25_output_0!/blocks.24/self_attn/Unsqueeze_25" Unsqueeze  */blocks.24/self_attn/Unsqueeze_22_output_0 */blocks.24/self_attn/Unsqueeze_23_output_0 )/blocks.24/self_attn/Constant_50_output_0 */blocks.24/self_attn/Unsqueeze_24_output_0 */blocks.24/self_attn/Unsqueeze_25_output_0'/blocks.24/self_attn/Concat_10_output_0/blocks.24/self_attn/Concat_10"Concat* axis )/blocks.24/self_attn/Constant_53_output_0 /blocks.24/self_attn/Constant_53"Constant*H value*<B,/blocks.24/self_attn/Constant_53_attr::valueJ  '/blocks.24/self_attn/Concat_10_output_0 )/blocks.24/self_attn/Constant_53_output_0'/blocks.24/self_attn/Reshape_5_output_0/blocks.24/self_attn/Reshape_5"Reshape* allowzero w '/blocks.24/self_attn/Reshape_5_output_0&/blocks.24/self_attn/Shape_13_output_0/blocks.24/self_attn/Shape_13"Shape  &/blocks.24/self_attn/Shape_13_output_0//blocks.24/self_attn/ConstantOfShape_1_output_0&/blocks.24/self_attn/ConstantOfShape_1"ConstantOfShape*N value*BB2/blocks.24/self_attn/ConstantOfShape_1_attr::valueJ )/blocks.24/self_attn/Constant_54_output_0 /blocks.24/self_attn/Constant_54"Constant*F value*:B,/blocks.24/self_attn/Constant_54_attr::valueJ  //blocks.24/self_attn/ConstantOfShape_1_output_0 )/blocks.24/self_attn/Constant_54_output_0#/blocks.24/self_attn/Mul_6_output_0/blocks.24/self_attn/Mul_6"Mul  '/blocks.24/self_attn/Reshape_5_output_0 #/blocks.24/self_attn/Mul_6_output_0%/blocks.24/self_attn/Equal_1_output_0/blocks.24/self_attn/Equal_1"Equal  %/blocks.24/self_attn/Equal_1_output_0 //blocks.24/self_attn/ConstantOfShape_1_output_0 '/blocks.24/self_attn/Reshape_5_output_0%/blocks.24/self_attn/Where_1_output_0/blocks.24/self_attn/Where_1"Where  */blocks.24/self_attn/Unsqueeze_21_output_0 %/blocks.24/self_attn/Where_1_output_0&/blocks.24/self_attn/Expand_1_output_0/blocks.24/self_attn/Expand_1"Expand )/blocks.24/self_attn/Constant_55_output_0 /blocks.24/self_attn/Constant_55"Constant*F value*:B,/blocks.24/self_attn/Constant_55_attr::valueJ  '/blocks.24/self_attn/Gather_11_output_0 )/blocks.24/self_attn/Constant_55_output_0#/blocks.24/self_attn/Mul_7_output_0/blocks.24/self_attn/Mul_7"Mul fonnx::Unsqueeze_7561 Constant_9051"Constant*5 value*)BConstant_9051_attr::valueJ  '/blocks.24/self_attn/Gather_10_output_0 onnx::Unsqueeze_7561*/blocks.24/self_attn/Unsqueeze_26_output_0!/blocks.24/self_attn/Unsqueeze_26" Unsqueeze fonnx::Unsqueeze_7563 Constant_9053"Constant*5 value*)BConstant_9053_attr::valueJ  #/blocks.24/self_attn/Mul_7_output_0 onnx::Unsqueeze_7563*/blocks.24/self_attn/Unsqueeze_27_output_0!/blocks.24/self_attn/Unsqueeze_27" Unsqueeze fonnx::Unsqueeze_7565 Constant_9055"Constant*5 value*)BConstant_9055_attr::valueJ  '/blocks.24/self_attn/Gather_12_output_0 onnx::Unsqueeze_7565*/blocks.24/self_attn/Unsqueeze_28_output_0!/blocks.24/self_attn/Unsqueeze_28" Unsqueeze fonnx::Unsqueeze_7567 Constant_9057"Constant*5 value*)BConstant_9057_attr::valueJ  '/blocks.24/self_attn/Gather_13_output_0 onnx::Unsqueeze_7567*/blocks.24/self_attn/Unsqueeze_29_output_0!/blocks.24/self_attn/Unsqueeze_29" Unsqueeze  */blocks.24/self_attn/Unsqueeze_26_output_0 */blocks.24/self_attn/Unsqueeze_27_output_0 */blocks.24/self_attn/Unsqueeze_28_output_0 */blocks.24/self_attn/Unsqueeze_29_output_0'/blocks.24/self_attn/Concat_11_output_0/blocks.24/self_attn/Concat_11"Concat* axis  &/blocks.24/self_attn/Expand_1_output_0 '/blocks.24/self_attn/Concat_11_output_0'/blocks.24/self_attn/Reshape_6_output_0/blocks.24/self_attn/Reshape_6"Reshape* allowzero  '/blocks.24/self_attn/Transpose_output_0 '/blocks.24/self_attn/Reshape_4_output_0$/blocks.24/self_attn/MatMul_output_0/blocks.24/self_attn/MatMul"MatMul )/blocks.24/self_attn/Constant_56_output_0 /blocks.24/self_attn/Constant_56"Constant*B value*6B,/blocks.24/self_attn/Constant_56_attr::valueJ5A  $/blocks.24/self_attn/MatMul_output_0 )/blocks.24/self_attn/Constant_56_output_0#/blocks.24/self_attn/Div_2_output_0/blocks.24/self_attn/Div_2"Div { #/blocks.24/self_attn/Div_2_output_0 attention_mask#/blocks.24/self_attn/Add_2_output_0/blocks.24/self_attn/Add_2"Add  #/blocks.24/self_attn/Add_2_output_0%/blocks.24/self_attn/Softmax_output_0/blocks.24/self_attn/Softmax"Softmax* axis { %/blocks.24/self_attn/Softmax_output_0$/blocks.24/self_attn/Cast_4_output_0/blocks.24/self_attn/Cast_4"Cast* to  $/blocks.24/self_attn/Cast_4_output_0 '/blocks.24/self_attn/Reshape_6_output_0&/blocks.24/self_attn/MatMul_1_output_0/blocks.24/self_attn/MatMul_1"MatMul  &/blocks.24/self_attn/MatMul_1_output_0)/blocks.24/self_attn/Transpose_3_output_0 /blocks.24/self_attn/Transpose_3" Transpose* perm@@@@ fonnx::Unsqueeze_7579 Constant_9069"Constant*5 value*)BConstant_9069_attr::valueJ  $/blocks.24/self_attn/Gather_output_0 onnx::Unsqueeze_7579*/blocks.24/self_attn/Unsqueeze_30_output_0!/blocks.24/self_attn/Unsqueeze_30" Unsqueeze fonnx::Unsqueeze_7581 Constant_9071"Constant*5 value*)BConstant_9071_attr::valueJ  &/blocks.24/self_attn/Gather_1_output_0 onnx::Unsqueeze_7581*/blocks.24/self_attn/Unsqueeze_31_output_0!/blocks.24/self_attn/Unsqueeze_31" Unsqueeze )/blocks.24/self_attn/Constant_57_output_0 /blocks.24/self_attn/Constant_57"Constant*H value*<B,/blocks.24/self_attn/Constant_57_attr::valueJ  */blocks.24/self_attn/Unsqueeze_30_output_0 */blocks.24/self_attn/Unsqueeze_31_output_0 )/blocks.24/self_attn/Constant_57_output_0'/blocks.24/self_attn/Concat_12_output_0/blocks.24/self_attn/Concat_12"Concat* axis  )/blocks.24/self_attn/Transpose_3_output_0 '/blocks.24/self_attn/Concat_12_output_0'/blocks.24/self_attn/Reshape_7_output_0/blocks.24/self_attn/Reshape_7"Reshape* allowzero  '/blocks.24/self_attn/Reshape_7_output_0 onnx::MatMul_9261+/blocks.24/self_attn/o_proj/MatMul_output_0"/blocks.24/self_attn/o_proj/MatMul"MatMul  */blocks.24/input_layernorm/Cast_1_output_0 +/blocks.24/self_attn/o_proj/MatMul_output_0/blocks.24/Add_output_0/blocks.24/Add"Add  /blocks.24/Add_output_01/blocks.24/post_attention_layernorm/Cast_output_0(/blocks.24/post_attention_layernorm/Cast"Cast* to 5/blocks.24/post_attention_layernorm/Constant_output_0,/blocks.24/post_attention_layernorm/Constant"Constant*N value*BB8/blocks.24/post_attention_layernorm/Constant_attr::valueJ@  1/blocks.24/post_attention_layernorm/Cast_output_0 5/blocks.24/post_attention_layernorm/Constant_output_00/blocks.24/post_attention_layernorm/Pow_output_0'/blocks.24/post_attention_layernorm/Pow"Pow  0/blocks.24/post_attention_layernorm/Pow_output_07/blocks.24/post_attention_layernorm/ReduceMean_output_0./blocks.24/post_attention_layernorm/ReduceMean" ReduceMean* axes@* keepdims 7/blocks.24/post_attention_layernorm/Constant_1_output_0./blocks.24/post_attention_layernorm/Constant_1"Constant*P value*DB:/blocks.24/post_attention_layernorm/Constant_1_attr::valueJ75  7/blocks.24/post_attention_layernorm/ReduceMean_output_0 7/blocks.24/post_attention_layernorm/Constant_1_output_00/blocks.24/post_attention_layernorm/Add_output_0'/blocks.24/post_attention_layernorm/Add"Add  0/blocks.24/post_attention_layernorm/Add_output_01/blocks.24/post_attention_layernorm/Sqrt_output_0(/blocks.24/post_attention_layernorm/Sqrt"Sqrt 7/blocks.24/post_attention_layernorm/Constant_2_output_0./blocks.24/post_attention_layernorm/Constant_2"Constant*P value*DB:/blocks.24/post_attention_layernorm/Constant_2_attr::valueJ?  7/blocks.24/post_attention_layernorm/Constant_2_output_0 1/blocks.24/post_attention_layernorm/Sqrt_output_00/blocks.24/post_attention_layernorm/Div_output_0'/blocks.24/post_attention_layernorm/Div"Div  1/blocks.24/post_attention_layernorm/Cast_output_03/blocks.24/post_attention_layernorm/Cast_1_output_0*/blocks.24/post_attention_layernorm/Cast_1"Cast* to  3/blocks.24/post_attention_layernorm/Cast_1_output_0 0/blocks.24/post_attention_layernorm/Div_output_00/blocks.24/post_attention_layernorm/Mul_output_0'/blocks.24/post_attention_layernorm/Mul"Mul  0/blocks.24/post_attention_layernorm/Mul_output_0 )blocks.24.post_attention_layernorm.weight2/blocks.24/post_attention_layernorm/Mul_1_output_0)/blocks.24/post_attention_layernorm/Mul_1"Mul  2/blocks.24/post_attention_layernorm/Mul_1_output_03/blocks.24/post_attention_layernorm/Cast_2_output_0*/blocks.24/post_attention_layernorm/Cast_2"Cast* to  3/blocks.24/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_9262(/blocks.24/mlp/gate_proj/MatMul_output_0/blocks.24/mlp/gate_proj/MatMul"MatMul z (/blocks.24/mlp/gate_proj/MatMul_output_0&/blocks.24/mlp/act_fn/Sigmoid_output_0/blocks.24/mlp/act_fn/Sigmoid"Sigmoid  (/blocks.24/mlp/gate_proj/MatMul_output_0 &/blocks.24/mlp/act_fn/Sigmoid_output_0"/blocks.24/mlp/act_fn/Mul_output_0/blocks.24/mlp/act_fn/Mul"Mul  3/blocks.24/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_9263&/blocks.24/mlp/up_proj/MatMul_output_0/blocks.24/mlp/up_proj/MatMul"MatMul  "/blocks.24/mlp/act_fn/Mul_output_0 &/blocks.24/mlp/up_proj/MatMul_output_0/blocks.24/mlp/Mul_output_0/blocks.24/mlp/Mul"Mul  /blocks.24/mlp/Mul_output_0 onnx::MatMul_9264(/blocks.24/mlp/down_proj/MatMul_output_0/blocks.24/mlp/down_proj/MatMul"MatMul  3/blocks.24/post_attention_layernorm/Cast_1_output_0 (/blocks.24/mlp/down_proj/MatMul_output_0/blocks.24/Add_1_output_0/blocks.24/Add_1"Add c/Constant_17_output_0 /Constant_17"Constant*2 value*&B/Constant_17_attr::valueJ ^ past_key_values /Constant_17_output_0/Gather_25_output_0 /Gather_25"Gather* axis /blocks.25/Constant_output_0/blocks.25/Constant"Constant*K value*?B/blocks.25/Constant_attr::valueJ  /blocks.24/Add_1_output_0 /blocks.25/Constant_output_0/blocks.25/Reshape_output_0/blocks.25/Reshape"Reshape* allowzero y /blocks.25/Reshape_output_0(/blocks.25/input_layernorm/Cast_output_0/blocks.25/input_layernorm/Cast"Cast* to ,/blocks.25/input_layernorm/Constant_output_0#/blocks.25/input_layernorm/Constant"Constant*E value*9B//blocks.25/input_layernorm/Constant_attr::valueJ@  (/blocks.25/input_layernorm/Cast_output_0 ,/blocks.25/input_layernorm/Constant_output_0'/blocks.25/input_layernorm/Pow_output_0/blocks.25/input_layernorm/Pow"Pow  '/blocks.25/input_layernorm/Pow_output_0./blocks.25/input_layernorm/ReduceMean_output_0%/blocks.25/input_layernorm/ReduceMean" ReduceMean* axes@* keepdims ./blocks.25/input_layernorm/Constant_1_output_0%/blocks.25/input_layernorm/Constant_1"Constant*G value*;B1/blocks.25/input_layernorm/Constant_1_attr::valueJ75  ./blocks.25/input_layernorm/ReduceMean_output_0 ./blocks.25/input_layernorm/Constant_1_output_0'/blocks.25/input_layernorm/Add_output_0/blocks.25/input_layernorm/Add"Add z '/blocks.25/input_layernorm/Add_output_0(/blocks.25/input_layernorm/Sqrt_output_0/blocks.25/input_layernorm/Sqrt"Sqrt ./blocks.25/input_layernorm/Constant_2_output_0%/blocks.25/input_layernorm/Constant_2"Constant*G value*;B1/blocks.25/input_layernorm/Constant_2_attr::valueJ?  ./blocks.25/input_layernorm/Constant_2_output_0 (/blocks.25/input_layernorm/Sqrt_output_0'/blocks.25/input_layernorm/Div_output_0/blocks.25/input_layernorm/Div"Div  (/blocks.25/input_layernorm/Cast_output_0*/blocks.25/input_layernorm/Cast_1_output_0!/blocks.25/input_layernorm/Cast_1"Cast* to  */blocks.25/input_layernorm/Cast_1_output_0 '/blocks.25/input_layernorm/Div_output_0'/blocks.25/input_layernorm/Mul_output_0/blocks.25/input_layernorm/Mul"Mul  '/blocks.25/input_layernorm/Mul_output_0 blocks.25.input_layernorm.weight)/blocks.25/input_layernorm/Mul_1_output_0 /blocks.25/input_layernorm/Mul_1"Mul  )/blocks.25/input_layernorm/Mul_1_output_0*/blocks.25/input_layernorm/Cast_2_output_0!/blocks.25/input_layernorm/Cast_2"Cast* to t */blocks.25/input_layernorm/Cast_2_output_0#/blocks.25/self_attn/Shape_output_0/blocks.25/self_attn/Shape"Shape &/blocks.25/self_attn/Constant_output_0/blocks.25/self_attn/Constant"Constant*C value*7B)/blocks.25/self_attn/Constant_attr::valueJ  #/blocks.25/self_attn/Shape_output_0 &/blocks.25/self_attn/Constant_output_0$/blocks.25/self_attn/Gather_output_0/blocks.25/self_attn/Gather"Gather* axis x */blocks.25/input_layernorm/Cast_2_output_0%/blocks.25/self_attn/Shape_1_output_0/blocks.25/self_attn/Shape_1"Shape (/blocks.25/self_attn/Constant_1_output_0/blocks.25/self_attn/Constant_1"Constant*E value*9B+/blocks.25/self_attn/Constant_1_attr::valueJ  %/blocks.25/self_attn/Shape_1_output_0 (/blocks.25/self_attn/Constant_1_output_0&/blocks.25/self_attn/Gather_1_output_0/blocks.25/self_attn/Gather_1"Gather* axis  */blocks.25/input_layernorm/Cast_2_output_0 onnx::MatMul_9265+/blocks.25/self_attn/q_proj/MatMul_output_0"/blocks.25/self_attn/q_proj/MatMul"MatMul  */blocks.25/input_layernorm/Cast_2_output_0 onnx::MatMul_9266+/blocks.25/self_attn/k_proj/MatMul_output_0"/blocks.25/self_attn/k_proj/MatMul"MatMul  */blocks.25/input_layernorm/Cast_2_output_0 onnx::MatMul_9267+/blocks.25/self_attn/v_proj/MatMul_output_0"/blocks.25/self_attn/v_proj/MatMul"MatMul fonnx::Unsqueeze_7642 Constant_9124"Constant*5 value*)BConstant_9124_attr::valueJ  $/blocks.25/self_attn/Gather_output_0 onnx::Unsqueeze_7642'/blocks.25/self_attn/Unsqueeze_output_0/blocks.25/self_attn/Unsqueeze" Unsqueeze fonnx::Unsqueeze_7644 Constant_9126"Constant*5 value*)BConstant_9126_attr::valueJ  &/blocks.25/self_attn/Gather_1_output_0 onnx::Unsqueeze_7644)/blocks.25/self_attn/Unsqueeze_1_output_0 /blocks.25/self_attn/Unsqueeze_1" Unsqueeze (/blocks.25/self_attn/Constant_2_output_0/blocks.25/self_attn/Constant_2"Constant*G value*;B+/blocks.25/self_attn/Constant_2_attr::valueJ (/blocks.25/self_attn/Constant_3_output_0/blocks.25/self_attn/Constant_3"Constant*G value*;B+/blocks.25/self_attn/Constant_3_attr::valueJ  '/blocks.25/self_attn/Unsqueeze_output_0 )/blocks.25/self_attn/Unsqueeze_1_output_0 (/blocks.25/self_attn/Constant_2_output_0 (/blocks.25/self_attn/Constant_3_output_0$/blocks.25/self_attn/Concat_output_0/blocks.25/self_attn/Concat"Concat* axis  +/blocks.25/self_attn/q_proj/MatMul_output_0 $/blocks.25/self_attn/Concat_output_0%/blocks.25/self_attn/Reshape_output_0/blocks.25/self_attn/Reshape"Reshape* allowzero fonnx::Unsqueeze_7652 Constant_9132"Constant*5 value*)BConstant_9132_attr::valueJ  $/blocks.25/self_attn/Gather_output_0 onnx::Unsqueeze_7652)/blocks.25/self_attn/Unsqueeze_2_output_0 /blocks.25/self_attn/Unsqueeze_2" Unsqueeze fonnx::Unsqueeze_7654 Constant_9134"Constant*5 value*)BConstant_9134_attr::valueJ  &/blocks.25/self_attn/Gather_1_output_0 onnx::Unsqueeze_7654)/blocks.25/self_attn/Unsqueeze_3_output_0 /blocks.25/self_attn/Unsqueeze_3" Unsqueeze (/blocks.25/self_attn/Constant_4_output_0/blocks.25/self_attn/Constant_4"Constant*G value*;B+/blocks.25/self_attn/Constant_4_attr::valueJ (/blocks.25/self_attn/Constant_5_output_0/blocks.25/self_attn/Constant_5"Constant*G value*;B+/blocks.25/self_attn/Constant_5_attr::valueJ  )/blocks.25/self_attn/Unsqueeze_2_output_0 )/blocks.25/self_attn/Unsqueeze_3_output_0 (/blocks.25/self_attn/Constant_4_output_0 (/blocks.25/self_attn/Constant_5_output_0&/blocks.25/self_attn/Concat_1_output_0/blocks.25/self_attn/Concat_1"Concat* axis fonnx::Unsqueeze_7661 Constant_9139"Constant*5 value*)BConstant_9139_attr::valueJ  $/blocks.25/self_attn/Gather_output_0 onnx::Unsqueeze_7661)/blocks.25/self_attn/Unsqueeze_4_output_0 /blocks.25/self_attn/Unsqueeze_4" Unsqueeze fonnx::Unsqueeze_7663 Constant_9141"Constant*5 value*)BConstant_9141_attr::valueJ  &/blocks.25/self_attn/Gather_1_output_0 onnx::Unsqueeze_7663)/blocks.25/self_attn/Unsqueeze_5_output_0 /blocks.25/self_attn/Unsqueeze_5" Unsqueeze (/blocks.25/self_attn/Constant_6_output_0/blocks.25/self_attn/Constant_6"Constant*G value*;B+/blocks.25/self_attn/Constant_6_attr::valueJ (/blocks.25/self_attn/Constant_7_output_0/blocks.25/self_attn/Constant_7"Constant*G value*;B+/blocks.25/self_attn/Constant_7_attr::valueJ  )/blocks.25/self_attn/Unsqueeze_4_output_0 )/blocks.25/self_attn/Unsqueeze_5_output_0 (/blocks.25/self_attn/Constant_6_output_0 (/blocks.25/self_attn/Constant_7_output_0&/blocks.25/self_attn/Concat_2_output_0/blocks.25/self_attn/Concat_2"Concat* axis  +/blocks.25/self_attn/k_proj/MatMul_output_0 &/blocks.25/self_attn/Concat_1_output_0'/blocks.25/self_attn/Reshape_1_output_0/blocks.25/self_attn/Reshape_1"Reshape* allowzero  +/blocks.25/self_attn/v_proj/MatMul_output_0 &/blocks.25/self_attn/Concat_2_output_0'/blocks.25/self_attn/Reshape_2_output_0/blocks.25/self_attn/Reshape_2"Reshape* allowzero  %/blocks.25/self_attn/Reshape_output_0)/blocks.25/self_attn/q_norm/Cast_output_0 /blocks.25/self_attn/q_norm/Cast"Cast* to -/blocks.25/self_attn/q_norm/Constant_output_0$/blocks.25/self_attn/q_norm/Constant"Constant*F value*:B0/blocks.25/self_attn/q_norm/Constant_attr::valueJ@  )/blocks.25/self_attn/q_norm/Cast_output_0 -/blocks.25/self_attn/q_norm/Constant_output_0(/blocks.25/self_attn/q_norm/Pow_output_0/blocks.25/self_attn/q_norm/Pow"Pow  (/blocks.25/self_attn/q_norm/Pow_output_0//blocks.25/self_attn/q_norm/ReduceMean_output_0&/blocks.25/self_attn/q_norm/ReduceMean" ReduceMean* axes@* keepdims //blocks.25/self_attn/q_norm/Constant_1_output_0&/blocks.25/self_attn/q_norm/Constant_1"Constant*H value*<B2/blocks.25/self_attn/q_norm/Constant_1_attr::valueJ75  //blocks.25/self_attn/q_norm/ReduceMean_output_0 //blocks.25/self_attn/q_norm/Constant_1_output_0(/blocks.25/self_attn/q_norm/Add_output_0/blocks.25/self_attn/q_norm/Add"Add } (/blocks.25/self_attn/q_norm/Add_output_0)/blocks.25/self_attn/q_norm/Sqrt_output_0 /blocks.25/self_attn/q_norm/Sqrt"Sqrt //blocks.25/self_attn/q_norm/Constant_2_output_0&/blocks.25/self_attn/q_norm/Constant_2"Constant*H value*<B2/blocks.25/self_attn/q_norm/Constant_2_attr::valueJ?  //blocks.25/self_attn/q_norm/Constant_2_output_0 )/blocks.25/self_attn/q_norm/Sqrt_output_0(/blocks.25/self_attn/q_norm/Div_output_0/blocks.25/self_attn/q_norm/Div"Div  )/blocks.25/self_attn/q_norm/Cast_output_0+/blocks.25/self_attn/q_norm/Cast_1_output_0"/blocks.25/self_attn/q_norm/Cast_1"Cast* to  +/blocks.25/self_attn/q_norm/Cast_1_output_0 (/blocks.25/self_attn/q_norm/Div_output_0(/blocks.25/self_attn/q_norm/Mul_output_0/blocks.25/self_attn/q_norm/Mul"Mul  (/blocks.25/self_attn/q_norm/Mul_output_0 !blocks.25.self_attn.q_norm.weight*/blocks.25/self_attn/q_norm/Mul_1_output_0!/blocks.25/self_attn/q_norm/Mul_1"Mul  */blocks.25/self_attn/q_norm/Mul_1_output_0+/blocks.25/self_attn/q_norm/Cast_2_output_0"/blocks.25/self_attn/q_norm/Cast_2"Cast* to  '/blocks.25/self_attn/Reshape_1_output_0)/blocks.25/self_attn/k_norm/Cast_output_0 /blocks.25/self_attn/k_norm/Cast"Cast* to -/blocks.25/self_attn/k_norm/Constant_output_0$/blocks.25/self_attn/k_norm/Constant"Constant*F value*:B0/blocks.25/self_attn/k_norm/Constant_attr::valueJ@  )/blocks.25/self_attn/k_norm/Cast_output_0 -/blocks.25/self_attn/k_norm/Constant_output_0(/blocks.25/self_attn/k_norm/Pow_output_0/blocks.25/self_attn/k_norm/Pow"Pow  (/blocks.25/self_attn/k_norm/Pow_output_0//blocks.25/self_attn/k_norm/ReduceMean_output_0&/blocks.25/self_attn/k_norm/ReduceMean" ReduceMean* axes@* keepdims //blocks.25/self_attn/k_norm/Constant_1_output_0&/blocks.25/self_attn/k_norm/Constant_1"Constant*H value*<B2/blocks.25/self_attn/k_norm/Constant_1_attr::valueJ75  //blocks.25/self_attn/k_norm/ReduceMean_output_0 //blocks.25/self_attn/k_norm/Constant_1_output_0(/blocks.25/self_attn/k_norm/Add_output_0/blocks.25/self_attn/k_norm/Add"Add } (/blocks.25/self_attn/k_norm/Add_output_0)/blocks.25/self_attn/k_norm/Sqrt_output_0 /blocks.25/self_attn/k_norm/Sqrt"Sqrt //blocks.25/self_attn/k_norm/Constant_2_output_0&/blocks.25/self_attn/k_norm/Constant_2"Constant*H value*<B2/blocks.25/self_attn/k_norm/Constant_2_attr::valueJ?  //blocks.25/self_attn/k_norm/Constant_2_output_0 )/blocks.25/self_attn/k_norm/Sqrt_output_0(/blocks.25/self_attn/k_norm/Div_output_0/blocks.25/self_attn/k_norm/Div"Div  )/blocks.25/self_attn/k_norm/Cast_output_0+/blocks.25/self_attn/k_norm/Cast_1_output_0"/blocks.25/self_attn/k_norm/Cast_1"Cast* to  +/blocks.25/self_attn/k_norm/Cast_1_output_0 (/blocks.25/self_attn/k_norm/Div_output_0(/blocks.25/self_attn/k_norm/Mul_output_0/blocks.25/self_attn/k_norm/Mul"Mul  (/blocks.25/self_attn/k_norm/Mul_output_0 !blocks.25.self_attn.k_norm.weight*/blocks.25/self_attn/k_norm/Mul_1_output_0!/blocks.25/self_attn/k_norm/Mul_1"Mul  */blocks.25/self_attn/k_norm/Mul_1_output_0+/blocks.25/self_attn/k_norm/Cast_2_output_0"/blocks.25/self_attn/k_norm/Cast_2"Cast* to  +/blocks.25/self_attn/q_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0!/blocks.25/self_attn/Mul_output_0/blocks.25/self_attn/Mul"Mul y +/blocks.25/self_attn/q_norm/Cast_2_output_0%/blocks.25/self_attn/Shape_2_output_0/blocks.25/self_attn/Shape_2"Shape (/blocks.25/self_attn/Constant_8_output_0/blocks.25/self_attn/Constant_8"Constant*E value*9B+/blocks.25/self_attn/Constant_8_attr::valueJ  %/blocks.25/self_attn/Shape_2_output_0 (/blocks.25/self_attn/Constant_8_output_0&/blocks.25/self_attn/Gather_2_output_0/blocks.25/self_attn/Gather_2"Gather* axis (/blocks.25/self_attn/Constant_9_output_0/blocks.25/self_attn/Constant_9"Constant*E value*9B+/blocks.25/self_attn/Constant_9_attr::valueJ  &/blocks.25/self_attn/Gather_2_output_0 (/blocks.25/self_attn/Constant_9_output_0!/blocks.25/self_attn/Div_output_0/blocks.25/self_attn/Div"Div s !/blocks.25/self_attn/Div_output_0"/blocks.25/self_attn/Cast_output_0/blocks.25/self_attn/Cast"Cast* to x "/blocks.25/self_attn/Cast_output_0$/blocks.25/self_attn/Cast_1_output_0/blocks.25/self_attn/Cast_1"Cast* to )/blocks.25/self_attn/Constant_10_output_0 /blocks.25/self_attn/Constant_10"Constant*H value*<B,/blocks.25/self_attn/Constant_10_attr::valueJ )/blocks.25/self_attn/Constant_11_output_0 /blocks.25/self_attn/Constant_11"Constant*H value*<B,/blocks.25/self_attn/Constant_11_attr::valueJ )/blocks.25/self_attn/Constant_12_output_0 /blocks.25/self_attn/Constant_12"Constant*H value*<B,/blocks.25/self_attn/Constant_12_attr::valueJ  $/blocks.25/self_attn/Cast_1_output_0 )/blocks.25/self_attn/Constant_12_output_0)/blocks.25/self_attn/Unsqueeze_6_output_0 /blocks.25/self_attn/Unsqueeze_6" Unsqueeze )/blocks.25/self_attn/Constant_13_output_0 /blocks.25/self_attn/Constant_13"Constant*H value*<B,/blocks.25/self_attn/Constant_13_attr::valueJ  +/blocks.25/self_attn/q_norm/Cast_2_output_0 )/blocks.25/self_attn/Constant_11_output_0 )/blocks.25/self_attn/Unsqueeze_6_output_0 )/blocks.25/self_attn/Constant_10_output_0 )/blocks.25/self_attn/Constant_13_output_0#/blocks.25/self_attn/Slice_output_0/blocks.25/self_attn/Slice"Slice )/blocks.25/self_attn/Constant_14_output_0 /blocks.25/self_attn/Constant_14"Constant*H value*<B,/blocks.25/self_attn/Constant_14_attr::valueJ )/blocks.25/self_attn/Constant_15_output_0 /blocks.25/self_attn/Constant_15"Constant*H value*<B,/blocks.25/self_attn/Constant_15_attr::valueJ  $/blocks.25/self_attn/Cast_1_output_0 )/blocks.25/self_attn/Constant_15_output_0)/blocks.25/self_attn/Unsqueeze_7_output_0 /blocks.25/self_attn/Unsqueeze_7" Unsqueeze )/blocks.25/self_attn/Constant_16_output_0 /blocks.25/self_attn/Constant_16"Constant*H value*<B,/blocks.25/self_attn/Constant_16_attr::valueJ )/blocks.25/self_attn/Constant_17_output_0 /blocks.25/self_attn/Constant_17"Constant*H value*<B,/blocks.25/self_attn/Constant_17_attr::valueJ  +/blocks.25/self_attn/q_norm/Cast_2_output_0 )/blocks.25/self_attn/Unsqueeze_7_output_0 )/blocks.25/self_attn/Constant_16_output_0 )/blocks.25/self_attn/Constant_14_output_0 )/blocks.25/self_attn/Constant_17_output_0%/blocks.25/self_attn/Slice_1_output_0/blocks.25/self_attn/Slice_1"Slice i %/blocks.25/self_attn/Slice_1_output_0!/blocks.25/self_attn/Neg_output_0/blocks.25/self_attn/Neg"Neg  !/blocks.25/self_attn/Neg_output_0 #/blocks.25/self_attn/Slice_output_0&/blocks.25/self_attn/Concat_3_output_0/blocks.25/self_attn/Concat_3"Concat* axis  &/blocks.25/self_attn/Concat_3_output_0 %/blocks.0/self_attn/Gather_3_output_0#/blocks.25/self_attn/Mul_1_output_0/blocks.25/self_attn/Mul_1"Mul  !/blocks.25/self_attn/Mul_output_0 #/blocks.25/self_attn/Mul_1_output_0!/blocks.25/self_attn/Add_output_0/blocks.25/self_attn/Add"Add  +/blocks.25/self_attn/k_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0#/blocks.25/self_attn/Mul_2_output_0/blocks.25/self_attn/Mul_2"Mul y +/blocks.25/self_attn/k_norm/Cast_2_output_0%/blocks.25/self_attn/Shape_3_output_0/blocks.25/self_attn/Shape_3"Shape )/blocks.25/self_attn/Constant_18_output_0 /blocks.25/self_attn/Constant_18"Constant*F value*:B,/blocks.25/self_attn/Constant_18_attr::valueJ  %/blocks.25/self_attn/Shape_3_output_0 )/blocks.25/self_attn/Constant_18_output_0&/blocks.25/self_attn/Gather_3_output_0/blocks.25/self_attn/Gather_3"Gather* axis )/blocks.25/self_attn/Constant_19_output_0 /blocks.25/self_attn/Constant_19"Constant*F value*:B,/blocks.25/self_attn/Constant_19_attr::valueJ  &/blocks.25/self_attn/Gather_3_output_0 )/blocks.25/self_attn/Constant_19_output_0#/blocks.25/self_attn/Div_1_output_0/blocks.25/self_attn/Div_1"Div y #/blocks.25/self_attn/Div_1_output_0$/blocks.25/self_attn/Cast_2_output_0/blocks.25/self_attn/Cast_2"Cast* to z $/blocks.25/self_attn/Cast_2_output_0$/blocks.25/self_attn/Cast_3_output_0/blocks.25/self_attn/Cast_3"Cast* to )/blocks.25/self_attn/Constant_20_output_0 /blocks.25/self_attn/Constant_20"Constant*H value*<B,/blocks.25/self_attn/Constant_20_attr::valueJ )/blocks.25/self_attn/Constant_21_output_0 /blocks.25/self_attn/Constant_21"Constant*H value*<B,/blocks.25/self_attn/Constant_21_attr::valueJ )/blocks.25/self_attn/Constant_22_output_0 /blocks.25/self_attn/Constant_22"Constant*H value*<B,/blocks.25/self_attn/Constant_22_attr::valueJ  $/blocks.25/self_attn/Cast_3_output_0 )/blocks.25/self_attn/Constant_22_output_0)/blocks.25/self_attn/Unsqueeze_8_output_0 /blocks.25/self_attn/Unsqueeze_8" Unsqueeze )/blocks.25/self_attn/Constant_23_output_0 /blocks.25/self_attn/Constant_23"Constant*H value*<B,/blocks.25/self_attn/Constant_23_attr::valueJ  +/blocks.25/self_attn/k_norm/Cast_2_output_0 )/blocks.25/self_attn/Constant_21_output_0 )/blocks.25/self_attn/Unsqueeze_8_output_0 )/blocks.25/self_attn/Constant_20_output_0 )/blocks.25/self_attn/Constant_23_output_0%/blocks.25/self_attn/Slice_2_output_0/blocks.25/self_attn/Slice_2"Slice )/blocks.25/self_attn/Constant_24_output_0 /blocks.25/self_attn/Constant_24"Constant*H value*<B,/blocks.25/self_attn/Constant_24_attr::valueJ )/blocks.25/self_attn/Constant_25_output_0 /blocks.25/self_attn/Constant_25"Constant*H value*<B,/blocks.25/self_attn/Constant_25_attr::valueJ  $/blocks.25/self_attn/Cast_3_output_0 )/blocks.25/self_attn/Constant_25_output_0)/blocks.25/self_attn/Unsqueeze_9_output_0 /blocks.25/self_attn/Unsqueeze_9" Unsqueeze )/blocks.25/self_attn/Constant_26_output_0 /blocks.25/self_attn/Constant_26"Constant*H value*<B,/blocks.25/self_attn/Constant_26_attr::valueJ )/blocks.25/self_attn/Constant_27_output_0 /blocks.25/self_attn/Constant_27"Constant*H value*<B,/blocks.25/self_attn/Constant_27_attr::valueJ  +/blocks.25/self_attn/k_norm/Cast_2_output_0 )/blocks.25/self_attn/Unsqueeze_9_output_0 )/blocks.25/self_attn/Constant_26_output_0 )/blocks.25/self_attn/Constant_24_output_0 )/blocks.25/self_attn/Constant_27_output_0%/blocks.25/self_attn/Slice_3_output_0/blocks.25/self_attn/Slice_3"Slice m %/blocks.25/self_attn/Slice_3_output_0#/blocks.25/self_attn/Neg_1_output_0/blocks.25/self_attn/Neg_1"Neg  #/blocks.25/self_attn/Neg_1_output_0 %/blocks.25/self_attn/Slice_2_output_0&/blocks.25/self_attn/Concat_4_output_0/blocks.25/self_attn/Concat_4"Concat* axis  &/blocks.25/self_attn/Concat_4_output_0 %/blocks.0/self_attn/Gather_3_output_0#/blocks.25/self_attn/Mul_3_output_0/blocks.25/self_attn/Mul_3"Mul  #/blocks.25/self_attn/Mul_2_output_0 #/blocks.25/self_attn/Mul_3_output_0#/blocks.25/self_attn/Add_1_output_0/blocks.25/self_attn/Add_1"Add  /Gather_25_output_0 /rotary/Constant_3_output_0&/blocks.25/self_attn/Gather_4_output_0/blocks.25/self_attn/Gather_4"Gather* axis  /Gather_25_output_0 /rotary/Constant_8_output_0&/blocks.25/self_attn/Gather_5_output_0/blocks.25/self_attn/Gather_5"Gather* axis  &/blocks.25/self_attn/Gather_4_output_0 #/blocks.25/self_attn/Add_1_output_0&/blocks.25/self_attn/Concat_5_output_0/blocks.25/self_attn/Concat_5"Concat* axis  &/blocks.25/self_attn/Gather_5_output_0 '/blocks.25/self_attn/Reshape_2_output_0&/blocks.25/self_attn/Concat_6_output_0/blocks.25/self_attn/Concat_6"Concat* axis )/blocks.25/self_attn/Constant_28_output_0 /blocks.25/self_attn/Constant_28"Constant*H value*<B,/blocks.25/self_attn/Constant_28_attr::valueJ  &/blocks.25/self_attn/Concat_5_output_0 )/blocks.25/self_attn/Constant_28_output_0*/blocks.25/self_attn/Unsqueeze_10_output_0!/blocks.25/self_attn/Unsqueeze_10" Unsqueeze )/blocks.25/self_attn/Constant_29_output_0 /blocks.25/self_attn/Constant_29"Constant*H value*<B,/blocks.25/self_attn/Constant_29_attr::valueJ  &/blocks.25/self_attn/Concat_6_output_0 )/blocks.25/self_attn/Constant_29_output_0*/blocks.25/self_attn/Unsqueeze_11_output_0!/blocks.25/self_attn/Unsqueeze_11" Unsqueeze  */blocks.25/self_attn/Unsqueeze_10_output_0 */blocks.25/self_attn/Unsqueeze_11_output_0&/blocks.25/self_attn/Concat_7_output_0/blocks.25/self_attn/Concat_7"Concat* axis  !/blocks.25/self_attn/Add_output_0'/blocks.25/self_attn/Transpose_output_0/blocks.25/self_attn/Transpose" Transpose* perm@@@@  &/blocks.25/self_attn/Concat_5_output_0)/blocks.25/self_attn/Transpose_1_output_0 /blocks.25/self_attn/Transpose_1" Transpose* perm@@@@  &/blocks.25/self_attn/Concat_6_output_0)/blocks.25/self_attn/Transpose_2_output_0 /blocks.25/self_attn/Transpose_2" Transpose* perm@@@@ w )/blocks.25/self_attn/Transpose_1_output_0%/blocks.25/self_attn/Shape_4_output_0/blocks.25/self_attn/Shape_4"Shape )/blocks.25/self_attn/Constant_30_output_0 /blocks.25/self_attn/Constant_30"Constant*F value*:B,/blocks.25/self_attn/Constant_30_attr::valueJ  %/blocks.25/self_attn/Shape_4_output_0 )/blocks.25/self_attn/Constant_30_output_0&/blocks.25/self_attn/Gather_6_output_0/blocks.25/self_attn/Gather_6"Gather* axis w )/blocks.25/self_attn/Transpose_1_output_0%/blocks.25/self_attn/Shape_5_output_0/blocks.25/self_attn/Shape_5"Shape )/blocks.25/self_attn/Constant_31_output_0 /blocks.25/self_attn/Constant_31"Constant*F value*:B,/blocks.25/self_attn/Constant_31_attr::valueJ  %/blocks.25/self_attn/Shape_5_output_0 )/blocks.25/self_attn/Constant_31_output_0&/blocks.25/self_attn/Gather_7_output_0/blocks.25/self_attn/Gather_7"Gather* axis w )/blocks.25/self_attn/Transpose_1_output_0%/blocks.25/self_attn/Shape_6_output_0/blocks.25/self_attn/Shape_6"Shape )/blocks.25/self_attn/Constant_32_output_0 /blocks.25/self_attn/Constant_32"Constant*F value*:B,/blocks.25/self_attn/Constant_32_attr::valueJ  %/blocks.25/self_attn/Shape_6_output_0 )/blocks.25/self_attn/Constant_32_output_0&/blocks.25/self_attn/Gather_8_output_0/blocks.25/self_attn/Gather_8"Gather* axis w )/blocks.25/self_attn/Transpose_1_output_0%/blocks.25/self_attn/Shape_7_output_0/blocks.25/self_attn/Shape_7"Shape )/blocks.25/self_attn/Constant_33_output_0 /blocks.25/self_attn/Constant_33"Constant*F value*:B,/blocks.25/self_attn/Constant_33_attr::valueJ  %/blocks.25/self_attn/Shape_7_output_0 )/blocks.25/self_attn/Constant_33_output_0&/blocks.25/self_attn/Gather_9_output_0/blocks.25/self_attn/Gather_9"Gather* axis )/blocks.25/self_attn/Constant_34_output_0 /blocks.25/self_attn/Constant_34"Constant*H value*<B,/blocks.25/self_attn/Constant_34_attr::valueJ  )/blocks.25/self_attn/Transpose_1_output_0 )/blocks.25/self_attn/Constant_34_output_0*/blocks.25/self_attn/Unsqueeze_12_output_0!/blocks.25/self_attn/Unsqueeze_12" Unsqueeze )/blocks.25/self_attn/Constant_35_output_0 /blocks.25/self_attn/Constant_35"Constant*H value*<B,/blocks.25/self_attn/Constant_35_attr::valueJ  &/blocks.25/self_attn/Gather_6_output_0 )/blocks.25/self_attn/Constant_35_output_0*/blocks.25/self_attn/Unsqueeze_13_output_0!/blocks.25/self_attn/Unsqueeze_13" Unsqueeze )/blocks.25/self_attn/Constant_36_output_0 /blocks.25/self_attn/Constant_36"Constant*H value*<B,/blocks.25/self_attn/Constant_36_attr::valueJ  &/blocks.25/self_attn/Gather_7_output_0 )/blocks.25/self_attn/Constant_36_output_0*/blocks.25/self_attn/Unsqueeze_14_output_0!/blocks.25/self_attn/Unsqueeze_14" Unsqueeze )/blocks.25/self_attn/Constant_37_output_0 /blocks.25/self_attn/Constant_37"Constant*H value*<B,/blocks.25/self_attn/Constant_37_attr::valueJ )/blocks.25/self_attn/Constant_38_output_0 /blocks.25/self_attn/Constant_38"Constant*H value*<B,/blocks.25/self_attn/Constant_38_attr::valueJ  &/blocks.25/self_attn/Gather_8_output_0 )/blocks.25/self_attn/Constant_38_output_0*/blocks.25/self_attn/Unsqueeze_15_output_0!/blocks.25/self_attn/Unsqueeze_15" Unsqueeze )/blocks.25/self_attn/Constant_39_output_0 /blocks.25/self_attn/Constant_39"Constant*H value*<B,/blocks.25/self_attn/Constant_39_attr::valueJ  &/blocks.25/self_attn/Gather_9_output_0 )/blocks.25/self_attn/Constant_39_output_0*/blocks.25/self_attn/Unsqueeze_16_output_0!/blocks.25/self_attn/Unsqueeze_16" Unsqueeze  */blocks.25/self_attn/Unsqueeze_13_output_0 */blocks.25/self_attn/Unsqueeze_14_output_0 )/blocks.25/self_attn/Constant_37_output_0 */blocks.25/self_attn/Unsqueeze_15_output_0 */blocks.25/self_attn/Unsqueeze_16_output_0&/blocks.25/self_attn/Concat_8_output_0/blocks.25/self_attn/Concat_8"Concat* axis )/blocks.25/self_attn/Constant_40_output_0 /blocks.25/self_attn/Constant_40"Constant*H value*<B,/blocks.25/self_attn/Constant_40_attr::valueJ  &/blocks.25/self_attn/Concat_8_output_0 )/blocks.25/self_attn/Constant_40_output_0'/blocks.25/self_attn/Reshape_3_output_0/blocks.25/self_attn/Reshape_3"Reshape* allowzero u '/blocks.25/self_attn/Reshape_3_output_0%/blocks.25/self_attn/Shape_8_output_0/blocks.25/self_attn/Shape_8"Shape  %/blocks.25/self_attn/Shape_8_output_0-/blocks.25/self_attn/ConstantOfShape_output_0$/blocks.25/self_attn/ConstantOfShape"ConstantOfShape*L value*@B0/blocks.25/self_attn/ConstantOfShape_attr::valueJ )/blocks.25/self_attn/Constant_41_output_0 /blocks.25/self_attn/Constant_41"Constant*F value*:B,/blocks.25/self_attn/Constant_41_attr::valueJ  -/blocks.25/self_attn/ConstantOfShape_output_0 )/blocks.25/self_attn/Constant_41_output_0#/blocks.25/self_attn/Mul_4_output_0/blocks.25/self_attn/Mul_4"Mul  '/blocks.25/self_attn/Reshape_3_output_0 #/blocks.25/self_attn/Mul_4_output_0#/blocks.25/self_attn/Equal_output_0/blocks.25/self_attn/Equal"Equal  #/blocks.25/self_attn/Equal_output_0 -/blocks.25/self_attn/ConstantOfShape_output_0 '/blocks.25/self_attn/Reshape_3_output_0#/blocks.25/self_attn/Where_output_0/blocks.25/self_attn/Where"Where  */blocks.25/self_attn/Unsqueeze_12_output_0 #/blocks.25/self_attn/Where_output_0$/blocks.25/self_attn/Expand_output_0/blocks.25/self_attn/Expand"Expand )/blocks.25/self_attn/Constant_42_output_0 /blocks.25/self_attn/Constant_42"Constant*F value*:B,/blocks.25/self_attn/Constant_42_attr::valueJ  &/blocks.25/self_attn/Gather_7_output_0 )/blocks.25/self_attn/Constant_42_output_0#/blocks.25/self_attn/Mul_5_output_0/blocks.25/self_attn/Mul_5"Mul fonnx::Unsqueeze_7806 Constant_9269"Constant*5 value*)BConstant_9269_attr::valueJ  &/blocks.25/self_attn/Gather_6_output_0 onnx::Unsqueeze_7806*/blocks.25/self_attn/Unsqueeze_17_output_0!/blocks.25/self_attn/Unsqueeze_17" Unsqueeze fonnx::Unsqueeze_7808 Constant_9271"Constant*5 value*)BConstant_9271_attr::valueJ  #/blocks.25/self_attn/Mul_5_output_0 onnx::Unsqueeze_7808*/blocks.25/self_attn/Unsqueeze_18_output_0!/blocks.25/self_attn/Unsqueeze_18" Unsqueeze fonnx::Unsqueeze_7810 Constant_9273"Constant*5 value*)BConstant_9273_attr::valueJ  &/blocks.25/self_attn/Gather_8_output_0 onnx::Unsqueeze_7810*/blocks.25/self_attn/Unsqueeze_19_output_0!/blocks.25/self_attn/Unsqueeze_19" Unsqueeze fonnx::Unsqueeze_7812 Constant_9275"Constant*5 value*)BConstant_9275_attr::valueJ  &/blocks.25/self_attn/Gather_9_output_0 onnx::Unsqueeze_7812*/blocks.25/self_attn/Unsqueeze_20_output_0!/blocks.25/self_attn/Unsqueeze_20" Unsqueeze  */blocks.25/self_attn/Unsqueeze_17_output_0 */blocks.25/self_attn/Unsqueeze_18_output_0 */blocks.25/self_attn/Unsqueeze_19_output_0 */blocks.25/self_attn/Unsqueeze_20_output_0&/blocks.25/self_attn/Concat_9_output_0/blocks.25/self_attn/Concat_9"Concat* axis  $/blocks.25/self_attn/Expand_output_0 &/blocks.25/self_attn/Concat_9_output_0'/blocks.25/self_attn/Reshape_4_output_0/blocks.25/self_attn/Reshape_4"Reshape* allowzero w )/blocks.25/self_attn/Transpose_2_output_0%/blocks.25/self_attn/Shape_9_output_0/blocks.25/self_attn/Shape_9"Shape )/blocks.25/self_attn/Constant_43_output_0 /blocks.25/self_attn/Constant_43"Constant*F value*:B,/blocks.25/self_attn/Constant_43_attr::valueJ  %/blocks.25/self_attn/Shape_9_output_0 )/blocks.25/self_attn/Constant_43_output_0'/blocks.25/self_attn/Gather_10_output_0/blocks.25/self_attn/Gather_10"Gather* axis y )/blocks.25/self_attn/Transpose_2_output_0&/blocks.25/self_attn/Shape_10_output_0/blocks.25/self_attn/Shape_10"Shape )/blocks.25/self_attn/Constant_44_output_0 /blocks.25/self_attn/Constant_44"Constant*F value*:B,/blocks.25/self_attn/Constant_44_attr::valueJ  &/blocks.25/self_attn/Shape_10_output_0 )/blocks.25/self_attn/Constant_44_output_0'/blocks.25/self_attn/Gather_11_output_0/blocks.25/self_attn/Gather_11"Gather* axis y )/blocks.25/self_attn/Transpose_2_output_0&/blocks.25/self_attn/Shape_11_output_0/blocks.25/self_attn/Shape_11"Shape )/blocks.25/self_attn/Constant_45_output_0 /blocks.25/self_attn/Constant_45"Constant*F value*:B,/blocks.25/self_attn/Constant_45_attr::valueJ  &/blocks.25/self_attn/Shape_11_output_0 )/blocks.25/self_attn/Constant_45_output_0'/blocks.25/self_attn/Gather_12_output_0/blocks.25/self_attn/Gather_12"Gather* axis y )/blocks.25/self_attn/Transpose_2_output_0&/blocks.25/self_attn/Shape_12_output_0/blocks.25/self_attn/Shape_12"Shape )/blocks.25/self_attn/Constant_46_output_0 /blocks.25/self_attn/Constant_46"Constant*F value*:B,/blocks.25/self_attn/Constant_46_attr::valueJ  &/blocks.25/self_attn/Shape_12_output_0 )/blocks.25/self_attn/Constant_46_output_0'/blocks.25/self_attn/Gather_13_output_0/blocks.25/self_attn/Gather_13"Gather* axis )/blocks.25/self_attn/Constant_47_output_0 /blocks.25/self_attn/Constant_47"Constant*H value*<B,/blocks.25/self_attn/Constant_47_attr::valueJ  )/blocks.25/self_attn/Transpose_2_output_0 )/blocks.25/self_attn/Constant_47_output_0*/blocks.25/self_attn/Unsqueeze_21_output_0!/blocks.25/self_attn/Unsqueeze_21" Unsqueeze )/blocks.25/self_attn/Constant_48_output_0 /blocks.25/self_attn/Constant_48"Constant*H value*<B,/blocks.25/self_attn/Constant_48_attr::valueJ  '/blocks.25/self_attn/Gather_10_output_0 )/blocks.25/self_attn/Constant_48_output_0*/blocks.25/self_attn/Unsqueeze_22_output_0!/blocks.25/self_attn/Unsqueeze_22" Unsqueeze )/blocks.25/self_attn/Constant_49_output_0 /blocks.25/self_attn/Constant_49"Constant*H value*<B,/blocks.25/self_attn/Constant_49_attr::valueJ  '/blocks.25/self_attn/Gather_11_output_0 )/blocks.25/self_attn/Constant_49_output_0*/blocks.25/self_attn/Unsqueeze_23_output_0!/blocks.25/self_attn/Unsqueeze_23" Unsqueeze )/blocks.25/self_attn/Constant_50_output_0 /blocks.25/self_attn/Constant_50"Constant*H value*<B,/blocks.25/self_attn/Constant_50_attr::valueJ )/blocks.25/self_attn/Constant_51_output_0 /blocks.25/self_attn/Constant_51"Constant*H value*<B,/blocks.25/self_attn/Constant_51_attr::valueJ  '/blocks.25/self_attn/Gather_12_output_0 )/blocks.25/self_attn/Constant_51_output_0*/blocks.25/self_attn/Unsqueeze_24_output_0!/blocks.25/self_attn/Unsqueeze_24" Unsqueeze )/blocks.25/self_attn/Constant_52_output_0 /blocks.25/self_attn/Constant_52"Constant*H value*<B,/blocks.25/self_attn/Constant_52_attr::valueJ  '/blocks.25/self_attn/Gather_13_output_0 )/blocks.25/self_attn/Constant_52_output_0*/blocks.25/self_attn/Unsqueeze_25_output_0!/blocks.25/self_attn/Unsqueeze_25" Unsqueeze  */blocks.25/self_attn/Unsqueeze_22_output_0 */blocks.25/self_attn/Unsqueeze_23_output_0 )/blocks.25/self_attn/Constant_50_output_0 */blocks.25/self_attn/Unsqueeze_24_output_0 */blocks.25/self_attn/Unsqueeze_25_output_0'/blocks.25/self_attn/Concat_10_output_0/blocks.25/self_attn/Concat_10"Concat* axis )/blocks.25/self_attn/Constant_53_output_0 /blocks.25/self_attn/Constant_53"Constant*H value*<B,/blocks.25/self_attn/Constant_53_attr::valueJ  '/blocks.25/self_attn/Concat_10_output_0 )/blocks.25/self_attn/Constant_53_output_0'/blocks.25/self_attn/Reshape_5_output_0/blocks.25/self_attn/Reshape_5"Reshape* allowzero w '/blocks.25/self_attn/Reshape_5_output_0&/blocks.25/self_attn/Shape_13_output_0/blocks.25/self_attn/Shape_13"Shape  &/blocks.25/self_attn/Shape_13_output_0//blocks.25/self_attn/ConstantOfShape_1_output_0&/blocks.25/self_attn/ConstantOfShape_1"ConstantOfShape*N value*BB2/blocks.25/self_attn/ConstantOfShape_1_attr::valueJ )/blocks.25/self_attn/Constant_54_output_0 /blocks.25/self_attn/Constant_54"Constant*F value*:B,/blocks.25/self_attn/Constant_54_attr::valueJ  //blocks.25/self_attn/ConstantOfShape_1_output_0 )/blocks.25/self_attn/Constant_54_output_0#/blocks.25/self_attn/Mul_6_output_0/blocks.25/self_attn/Mul_6"Mul  '/blocks.25/self_attn/Reshape_5_output_0 #/blocks.25/self_attn/Mul_6_output_0%/blocks.25/self_attn/Equal_1_output_0/blocks.25/self_attn/Equal_1"Equal  %/blocks.25/self_attn/Equal_1_output_0 //blocks.25/self_attn/ConstantOfShape_1_output_0 '/blocks.25/self_attn/Reshape_5_output_0%/blocks.25/self_attn/Where_1_output_0/blocks.25/self_attn/Where_1"Where  */blocks.25/self_attn/Unsqueeze_21_output_0 %/blocks.25/self_attn/Where_1_output_0&/blocks.25/self_attn/Expand_1_output_0/blocks.25/self_attn/Expand_1"Expand )/blocks.25/self_attn/Constant_55_output_0 /blocks.25/self_attn/Constant_55"Constant*F value*:B,/blocks.25/self_attn/Constant_55_attr::valueJ  '/blocks.25/self_attn/Gather_11_output_0 )/blocks.25/self_attn/Constant_55_output_0#/blocks.25/self_attn/Mul_7_output_0/blocks.25/self_attn/Mul_7"Mul fonnx::Unsqueeze_7852 Constant_9314"Constant*5 value*)BConstant_9314_attr::valueJ  '/blocks.25/self_attn/Gather_10_output_0 onnx::Unsqueeze_7852*/blocks.25/self_attn/Unsqueeze_26_output_0!/blocks.25/self_attn/Unsqueeze_26" Unsqueeze fonnx::Unsqueeze_7854 Constant_9316"Constant*5 value*)BConstant_9316_attr::valueJ  #/blocks.25/self_attn/Mul_7_output_0 onnx::Unsqueeze_7854*/blocks.25/self_attn/Unsqueeze_27_output_0!/blocks.25/self_attn/Unsqueeze_27" Unsqueeze fonnx::Unsqueeze_7856 Constant_9318"Constant*5 value*)BConstant_9318_attr::valueJ  '/blocks.25/self_attn/Gather_12_output_0 onnx::Unsqueeze_7856*/blocks.25/self_attn/Unsqueeze_28_output_0!/blocks.25/self_attn/Unsqueeze_28" Unsqueeze fonnx::Unsqueeze_7858 Constant_9320"Constant*5 value*)BConstant_9320_attr::valueJ  '/blocks.25/self_attn/Gather_13_output_0 onnx::Unsqueeze_7858*/blocks.25/self_attn/Unsqueeze_29_output_0!/blocks.25/self_attn/Unsqueeze_29" Unsqueeze  */blocks.25/self_attn/Unsqueeze_26_output_0 */blocks.25/self_attn/Unsqueeze_27_output_0 */blocks.25/self_attn/Unsqueeze_28_output_0 */blocks.25/self_attn/Unsqueeze_29_output_0'/blocks.25/self_attn/Concat_11_output_0/blocks.25/self_attn/Concat_11"Concat* axis  &/blocks.25/self_attn/Expand_1_output_0 '/blocks.25/self_attn/Concat_11_output_0'/blocks.25/self_attn/Reshape_6_output_0/blocks.25/self_attn/Reshape_6"Reshape* allowzero  '/blocks.25/self_attn/Transpose_output_0 '/blocks.25/self_attn/Reshape_4_output_0$/blocks.25/self_attn/MatMul_output_0/blocks.25/self_attn/MatMul"MatMul )/blocks.25/self_attn/Constant_56_output_0 /blocks.25/self_attn/Constant_56"Constant*B value*6B,/blocks.25/self_attn/Constant_56_attr::valueJ5A  $/blocks.25/self_attn/MatMul_output_0 )/blocks.25/self_attn/Constant_56_output_0#/blocks.25/self_attn/Div_2_output_0/blocks.25/self_attn/Div_2"Div { #/blocks.25/self_attn/Div_2_output_0 attention_mask#/blocks.25/self_attn/Add_2_output_0/blocks.25/self_attn/Add_2"Add  #/blocks.25/self_attn/Add_2_output_0%/blocks.25/self_attn/Softmax_output_0/blocks.25/self_attn/Softmax"Softmax* axis { %/blocks.25/self_attn/Softmax_output_0$/blocks.25/self_attn/Cast_4_output_0/blocks.25/self_attn/Cast_4"Cast* to  $/blocks.25/self_attn/Cast_4_output_0 '/blocks.25/self_attn/Reshape_6_output_0&/blocks.25/self_attn/MatMul_1_output_0/blocks.25/self_attn/MatMul_1"MatMul  &/blocks.25/self_attn/MatMul_1_output_0)/blocks.25/self_attn/Transpose_3_output_0 /blocks.25/self_attn/Transpose_3" Transpose* perm@@@@ fonnx::Unsqueeze_7870 Constant_9332"Constant*5 value*)BConstant_9332_attr::valueJ  $/blocks.25/self_attn/Gather_output_0 onnx::Unsqueeze_7870*/blocks.25/self_attn/Unsqueeze_30_output_0!/blocks.25/self_attn/Unsqueeze_30" Unsqueeze fonnx::Unsqueeze_7872 Constant_9334"Constant*5 value*)BConstant_9334_attr::valueJ  &/blocks.25/self_attn/Gather_1_output_0 onnx::Unsqueeze_7872*/blocks.25/self_attn/Unsqueeze_31_output_0!/blocks.25/self_attn/Unsqueeze_31" Unsqueeze )/blocks.25/self_attn/Constant_57_output_0 /blocks.25/self_attn/Constant_57"Constant*H value*<B,/blocks.25/self_attn/Constant_57_attr::valueJ  */blocks.25/self_attn/Unsqueeze_30_output_0 */blocks.25/self_attn/Unsqueeze_31_output_0 )/blocks.25/self_attn/Constant_57_output_0'/blocks.25/self_attn/Concat_12_output_0/blocks.25/self_attn/Concat_12"Concat* axis  )/blocks.25/self_attn/Transpose_3_output_0 '/blocks.25/self_attn/Concat_12_output_0'/blocks.25/self_attn/Reshape_7_output_0/blocks.25/self_attn/Reshape_7"Reshape* allowzero  '/blocks.25/self_attn/Reshape_7_output_0 onnx::MatMul_9289+/blocks.25/self_attn/o_proj/MatMul_output_0"/blocks.25/self_attn/o_proj/MatMul"MatMul  */blocks.25/input_layernorm/Cast_1_output_0 +/blocks.25/self_attn/o_proj/MatMul_output_0/blocks.25/Add_output_0/blocks.25/Add"Add  /blocks.25/Add_output_01/blocks.25/post_attention_layernorm/Cast_output_0(/blocks.25/post_attention_layernorm/Cast"Cast* to 5/blocks.25/post_attention_layernorm/Constant_output_0,/blocks.25/post_attention_layernorm/Constant"Constant*N value*BB8/blocks.25/post_attention_layernorm/Constant_attr::valueJ@  1/blocks.25/post_attention_layernorm/Cast_output_0 5/blocks.25/post_attention_layernorm/Constant_output_00/blocks.25/post_attention_layernorm/Pow_output_0'/blocks.25/post_attention_layernorm/Pow"Pow  0/blocks.25/post_attention_layernorm/Pow_output_07/blocks.25/post_attention_layernorm/ReduceMean_output_0./blocks.25/post_attention_layernorm/ReduceMean" ReduceMean* axes@* keepdims 7/blocks.25/post_attention_layernorm/Constant_1_output_0./blocks.25/post_attention_layernorm/Constant_1"Constant*P value*DB:/blocks.25/post_attention_layernorm/Constant_1_attr::valueJ75  7/blocks.25/post_attention_layernorm/ReduceMean_output_0 7/blocks.25/post_attention_layernorm/Constant_1_output_00/blocks.25/post_attention_layernorm/Add_output_0'/blocks.25/post_attention_layernorm/Add"Add  0/blocks.25/post_attention_layernorm/Add_output_01/blocks.25/post_attention_layernorm/Sqrt_output_0(/blocks.25/post_attention_layernorm/Sqrt"Sqrt 7/blocks.25/post_attention_layernorm/Constant_2_output_0./blocks.25/post_attention_layernorm/Constant_2"Constant*P value*DB:/blocks.25/post_attention_layernorm/Constant_2_attr::valueJ?  7/blocks.25/post_attention_layernorm/Constant_2_output_0 1/blocks.25/post_attention_layernorm/Sqrt_output_00/blocks.25/post_attention_layernorm/Div_output_0'/blocks.25/post_attention_layernorm/Div"Div  1/blocks.25/post_attention_layernorm/Cast_output_03/blocks.25/post_attention_layernorm/Cast_1_output_0*/blocks.25/post_attention_layernorm/Cast_1"Cast* to  3/blocks.25/post_attention_layernorm/Cast_1_output_0 0/blocks.25/post_attention_layernorm/Div_output_00/blocks.25/post_attention_layernorm/Mul_output_0'/blocks.25/post_attention_layernorm/Mul"Mul  0/blocks.25/post_attention_layernorm/Mul_output_0 )blocks.25.post_attention_layernorm.weight2/blocks.25/post_attention_layernorm/Mul_1_output_0)/blocks.25/post_attention_layernorm/Mul_1"Mul  2/blocks.25/post_attention_layernorm/Mul_1_output_03/blocks.25/post_attention_layernorm/Cast_2_output_0*/blocks.25/post_attention_layernorm/Cast_2"Cast* to  3/blocks.25/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_9290(/blocks.25/mlp/gate_proj/MatMul_output_0/blocks.25/mlp/gate_proj/MatMul"MatMul z (/blocks.25/mlp/gate_proj/MatMul_output_0&/blocks.25/mlp/act_fn/Sigmoid_output_0/blocks.25/mlp/act_fn/Sigmoid"Sigmoid  (/blocks.25/mlp/gate_proj/MatMul_output_0 &/blocks.25/mlp/act_fn/Sigmoid_output_0"/blocks.25/mlp/act_fn/Mul_output_0/blocks.25/mlp/act_fn/Mul"Mul  3/blocks.25/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_9291&/blocks.25/mlp/up_proj/MatMul_output_0/blocks.25/mlp/up_proj/MatMul"MatMul  "/blocks.25/mlp/act_fn/Mul_output_0 &/blocks.25/mlp/up_proj/MatMul_output_0/blocks.25/mlp/Mul_output_0/blocks.25/mlp/Mul"Mul  /blocks.25/mlp/Mul_output_0 onnx::MatMul_9292(/blocks.25/mlp/down_proj/MatMul_output_0/blocks.25/mlp/down_proj/MatMul"MatMul  3/blocks.25/post_attention_layernorm/Cast_1_output_0 (/blocks.25/mlp/down_proj/MatMul_output_0/blocks.25/Add_1_output_0/blocks.25/Add_1"Add c/Constant_18_output_0 /Constant_18"Constant*2 value*&B/Constant_18_attr::valueJ ^ past_key_values /Constant_18_output_0/Gather_26_output_0 /Gather_26"Gather* axis /blocks.26/Constant_output_0/blocks.26/Constant"Constant*K value*?B/blocks.26/Constant_attr::valueJ  /blocks.25/Add_1_output_0 /blocks.26/Constant_output_0/blocks.26/Reshape_output_0/blocks.26/Reshape"Reshape* allowzero y /blocks.26/Reshape_output_0(/blocks.26/input_layernorm/Cast_output_0/blocks.26/input_layernorm/Cast"Cast* to ,/blocks.26/input_layernorm/Constant_output_0#/blocks.26/input_layernorm/Constant"Constant*E value*9B//blocks.26/input_layernorm/Constant_attr::valueJ@  (/blocks.26/input_layernorm/Cast_output_0 ,/blocks.26/input_layernorm/Constant_output_0'/blocks.26/input_layernorm/Pow_output_0/blocks.26/input_layernorm/Pow"Pow  '/blocks.26/input_layernorm/Pow_output_0./blocks.26/input_layernorm/ReduceMean_output_0%/blocks.26/input_layernorm/ReduceMean" ReduceMean* axes@* keepdims ./blocks.26/input_layernorm/Constant_1_output_0%/blocks.26/input_layernorm/Constant_1"Constant*G value*;B1/blocks.26/input_layernorm/Constant_1_attr::valueJ75  ./blocks.26/input_layernorm/ReduceMean_output_0 ./blocks.26/input_layernorm/Constant_1_output_0'/blocks.26/input_layernorm/Add_output_0/blocks.26/input_layernorm/Add"Add z '/blocks.26/input_layernorm/Add_output_0(/blocks.26/input_layernorm/Sqrt_output_0/blocks.26/input_layernorm/Sqrt"Sqrt ./blocks.26/input_layernorm/Constant_2_output_0%/blocks.26/input_layernorm/Constant_2"Constant*G value*;B1/blocks.26/input_layernorm/Constant_2_attr::valueJ?  ./blocks.26/input_layernorm/Constant_2_output_0 (/blocks.26/input_layernorm/Sqrt_output_0'/blocks.26/input_layernorm/Div_output_0/blocks.26/input_layernorm/Div"Div  (/blocks.26/input_layernorm/Cast_output_0*/blocks.26/input_layernorm/Cast_1_output_0!/blocks.26/input_layernorm/Cast_1"Cast* to  */blocks.26/input_layernorm/Cast_1_output_0 '/blocks.26/input_layernorm/Div_output_0'/blocks.26/input_layernorm/Mul_output_0/blocks.26/input_layernorm/Mul"Mul  '/blocks.26/input_layernorm/Mul_output_0 blocks.26.input_layernorm.weight)/blocks.26/input_layernorm/Mul_1_output_0 /blocks.26/input_layernorm/Mul_1"Mul  )/blocks.26/input_layernorm/Mul_1_output_0*/blocks.26/input_layernorm/Cast_2_output_0!/blocks.26/input_layernorm/Cast_2"Cast* to t */blocks.26/input_layernorm/Cast_2_output_0#/blocks.26/self_attn/Shape_output_0/blocks.26/self_attn/Shape"Shape &/blocks.26/self_attn/Constant_output_0/blocks.26/self_attn/Constant"Constant*C value*7B)/blocks.26/self_attn/Constant_attr::valueJ  #/blocks.26/self_attn/Shape_output_0 &/blocks.26/self_attn/Constant_output_0$/blocks.26/self_attn/Gather_output_0/blocks.26/self_attn/Gather"Gather* axis x */blocks.26/input_layernorm/Cast_2_output_0%/blocks.26/self_attn/Shape_1_output_0/blocks.26/self_attn/Shape_1"Shape (/blocks.26/self_attn/Constant_1_output_0/blocks.26/self_attn/Constant_1"Constant*E value*9B+/blocks.26/self_attn/Constant_1_attr::valueJ  %/blocks.26/self_attn/Shape_1_output_0 (/blocks.26/self_attn/Constant_1_output_0&/blocks.26/self_attn/Gather_1_output_0/blocks.26/self_attn/Gather_1"Gather* axis  */blocks.26/input_layernorm/Cast_2_output_0 onnx::MatMul_9293+/blocks.26/self_attn/q_proj/MatMul_output_0"/blocks.26/self_attn/q_proj/MatMul"MatMul  */blocks.26/input_layernorm/Cast_2_output_0 onnx::MatMul_9294+/blocks.26/self_attn/k_proj/MatMul_output_0"/blocks.26/self_attn/k_proj/MatMul"MatMul  */blocks.26/input_layernorm/Cast_2_output_0 onnx::MatMul_9295+/blocks.26/self_attn/v_proj/MatMul_output_0"/blocks.26/self_attn/v_proj/MatMul"MatMul fonnx::Unsqueeze_7933 Constant_9387"Constant*5 value*)BConstant_9387_attr::valueJ  $/blocks.26/self_attn/Gather_output_0 onnx::Unsqueeze_7933'/blocks.26/self_attn/Unsqueeze_output_0/blocks.26/self_attn/Unsqueeze" Unsqueeze fonnx::Unsqueeze_7935 Constant_9389"Constant*5 value*)BConstant_9389_attr::valueJ  &/blocks.26/self_attn/Gather_1_output_0 onnx::Unsqueeze_7935)/blocks.26/self_attn/Unsqueeze_1_output_0 /blocks.26/self_attn/Unsqueeze_1" Unsqueeze (/blocks.26/self_attn/Constant_2_output_0/blocks.26/self_attn/Constant_2"Constant*G value*;B+/blocks.26/self_attn/Constant_2_attr::valueJ (/blocks.26/self_attn/Constant_3_output_0/blocks.26/self_attn/Constant_3"Constant*G value*;B+/blocks.26/self_attn/Constant_3_attr::valueJ  '/blocks.26/self_attn/Unsqueeze_output_0 )/blocks.26/self_attn/Unsqueeze_1_output_0 (/blocks.26/self_attn/Constant_2_output_0 (/blocks.26/self_attn/Constant_3_output_0$/blocks.26/self_attn/Concat_output_0/blocks.26/self_attn/Concat"Concat* axis  +/blocks.26/self_attn/q_proj/MatMul_output_0 $/blocks.26/self_attn/Concat_output_0%/blocks.26/self_attn/Reshape_output_0/blocks.26/self_attn/Reshape"Reshape* allowzero fonnx::Unsqueeze_7943 Constant_9395"Constant*5 value*)BConstant_9395_attr::valueJ  $/blocks.26/self_attn/Gather_output_0 onnx::Unsqueeze_7943)/blocks.26/self_attn/Unsqueeze_2_output_0 /blocks.26/self_attn/Unsqueeze_2" Unsqueeze fonnx::Unsqueeze_7945 Constant_9397"Constant*5 value*)BConstant_9397_attr::valueJ  &/blocks.26/self_attn/Gather_1_output_0 onnx::Unsqueeze_7945)/blocks.26/self_attn/Unsqueeze_3_output_0 /blocks.26/self_attn/Unsqueeze_3" Unsqueeze (/blocks.26/self_attn/Constant_4_output_0/blocks.26/self_attn/Constant_4"Constant*G value*;B+/blocks.26/self_attn/Constant_4_attr::valueJ (/blocks.26/self_attn/Constant_5_output_0/blocks.26/self_attn/Constant_5"Constant*G value*;B+/blocks.26/self_attn/Constant_5_attr::valueJ  )/blocks.26/self_attn/Unsqueeze_2_output_0 )/blocks.26/self_attn/Unsqueeze_3_output_0 (/blocks.26/self_attn/Constant_4_output_0 (/blocks.26/self_attn/Constant_5_output_0&/blocks.26/self_attn/Concat_1_output_0/blocks.26/self_attn/Concat_1"Concat* axis fonnx::Unsqueeze_7952 Constant_9402"Constant*5 value*)BConstant_9402_attr::valueJ  $/blocks.26/self_attn/Gather_output_0 onnx::Unsqueeze_7952)/blocks.26/self_attn/Unsqueeze_4_output_0 /blocks.26/self_attn/Unsqueeze_4" Unsqueeze fonnx::Unsqueeze_7954 Constant_9404"Constant*5 value*)BConstant_9404_attr::valueJ  &/blocks.26/self_attn/Gather_1_output_0 onnx::Unsqueeze_7954)/blocks.26/self_attn/Unsqueeze_5_output_0 /blocks.26/self_attn/Unsqueeze_5" Unsqueeze (/blocks.26/self_attn/Constant_6_output_0/blocks.26/self_attn/Constant_6"Constant*G value*;B+/blocks.26/self_attn/Constant_6_attr::valueJ (/blocks.26/self_attn/Constant_7_output_0/blocks.26/self_attn/Constant_7"Constant*G value*;B+/blocks.26/self_attn/Constant_7_attr::valueJ  )/blocks.26/self_attn/Unsqueeze_4_output_0 )/blocks.26/self_attn/Unsqueeze_5_output_0 (/blocks.26/self_attn/Constant_6_output_0 (/blocks.26/self_attn/Constant_7_output_0&/blocks.26/self_attn/Concat_2_output_0/blocks.26/self_attn/Concat_2"Concat* axis  +/blocks.26/self_attn/k_proj/MatMul_output_0 &/blocks.26/self_attn/Concat_1_output_0'/blocks.26/self_attn/Reshape_1_output_0/blocks.26/self_attn/Reshape_1"Reshape* allowzero  +/blocks.26/self_attn/v_proj/MatMul_output_0 &/blocks.26/self_attn/Concat_2_output_0'/blocks.26/self_attn/Reshape_2_output_0/blocks.26/self_attn/Reshape_2"Reshape* allowzero  %/blocks.26/self_attn/Reshape_output_0)/blocks.26/self_attn/q_norm/Cast_output_0 /blocks.26/self_attn/q_norm/Cast"Cast* to -/blocks.26/self_attn/q_norm/Constant_output_0$/blocks.26/self_attn/q_norm/Constant"Constant*F value*:B0/blocks.26/self_attn/q_norm/Constant_attr::valueJ@  )/blocks.26/self_attn/q_norm/Cast_output_0 -/blocks.26/self_attn/q_norm/Constant_output_0(/blocks.26/self_attn/q_norm/Pow_output_0/blocks.26/self_attn/q_norm/Pow"Pow  (/blocks.26/self_attn/q_norm/Pow_output_0//blocks.26/self_attn/q_norm/ReduceMean_output_0&/blocks.26/self_attn/q_norm/ReduceMean" ReduceMean* axes@* keepdims //blocks.26/self_attn/q_norm/Constant_1_output_0&/blocks.26/self_attn/q_norm/Constant_1"Constant*H value*<B2/blocks.26/self_attn/q_norm/Constant_1_attr::valueJ75  //blocks.26/self_attn/q_norm/ReduceMean_output_0 //blocks.26/self_attn/q_norm/Constant_1_output_0(/blocks.26/self_attn/q_norm/Add_output_0/blocks.26/self_attn/q_norm/Add"Add } (/blocks.26/self_attn/q_norm/Add_output_0)/blocks.26/self_attn/q_norm/Sqrt_output_0 /blocks.26/self_attn/q_norm/Sqrt"Sqrt //blocks.26/self_attn/q_norm/Constant_2_output_0&/blocks.26/self_attn/q_norm/Constant_2"Constant*H value*<B2/blocks.26/self_attn/q_norm/Constant_2_attr::valueJ?  //blocks.26/self_attn/q_norm/Constant_2_output_0 )/blocks.26/self_attn/q_norm/Sqrt_output_0(/blocks.26/self_attn/q_norm/Div_output_0/blocks.26/self_attn/q_norm/Div"Div  )/blocks.26/self_attn/q_norm/Cast_output_0+/blocks.26/self_attn/q_norm/Cast_1_output_0"/blocks.26/self_attn/q_norm/Cast_1"Cast* to  +/blocks.26/self_attn/q_norm/Cast_1_output_0 (/blocks.26/self_attn/q_norm/Div_output_0(/blocks.26/self_attn/q_norm/Mul_output_0/blocks.26/self_attn/q_norm/Mul"Mul  (/blocks.26/self_attn/q_norm/Mul_output_0 !blocks.26.self_attn.q_norm.weight*/blocks.26/self_attn/q_norm/Mul_1_output_0!/blocks.26/self_attn/q_norm/Mul_1"Mul  */blocks.26/self_attn/q_norm/Mul_1_output_0+/blocks.26/self_attn/q_norm/Cast_2_output_0"/blocks.26/self_attn/q_norm/Cast_2"Cast* to  '/blocks.26/self_attn/Reshape_1_output_0)/blocks.26/self_attn/k_norm/Cast_output_0 /blocks.26/self_attn/k_norm/Cast"Cast* to -/blocks.26/self_attn/k_norm/Constant_output_0$/blocks.26/self_attn/k_norm/Constant"Constant*F value*:B0/blocks.26/self_attn/k_norm/Constant_attr::valueJ@  )/blocks.26/self_attn/k_norm/Cast_output_0 -/blocks.26/self_attn/k_norm/Constant_output_0(/blocks.26/self_attn/k_norm/Pow_output_0/blocks.26/self_attn/k_norm/Pow"Pow  (/blocks.26/self_attn/k_norm/Pow_output_0//blocks.26/self_attn/k_norm/ReduceMean_output_0&/blocks.26/self_attn/k_norm/ReduceMean" ReduceMean* axes@* keepdims //blocks.26/self_attn/k_norm/Constant_1_output_0&/blocks.26/self_attn/k_norm/Constant_1"Constant*H value*<B2/blocks.26/self_attn/k_norm/Constant_1_attr::valueJ75  //blocks.26/self_attn/k_norm/ReduceMean_output_0 //blocks.26/self_attn/k_norm/Constant_1_output_0(/blocks.26/self_attn/k_norm/Add_output_0/blocks.26/self_attn/k_norm/Add"Add } (/blocks.26/self_attn/k_norm/Add_output_0)/blocks.26/self_attn/k_norm/Sqrt_output_0 /blocks.26/self_attn/k_norm/Sqrt"Sqrt //blocks.26/self_attn/k_norm/Constant_2_output_0&/blocks.26/self_attn/k_norm/Constant_2"Constant*H value*<B2/blocks.26/self_attn/k_norm/Constant_2_attr::valueJ?  //blocks.26/self_attn/k_norm/Constant_2_output_0 )/blocks.26/self_attn/k_norm/Sqrt_output_0(/blocks.26/self_attn/k_norm/Div_output_0/blocks.26/self_attn/k_norm/Div"Div  )/blocks.26/self_attn/k_norm/Cast_output_0+/blocks.26/self_attn/k_norm/Cast_1_output_0"/blocks.26/self_attn/k_norm/Cast_1"Cast* to  +/blocks.26/self_attn/k_norm/Cast_1_output_0 (/blocks.26/self_attn/k_norm/Div_output_0(/blocks.26/self_attn/k_norm/Mul_output_0/blocks.26/self_attn/k_norm/Mul"Mul  (/blocks.26/self_attn/k_norm/Mul_output_0 !blocks.26.self_attn.k_norm.weight*/blocks.26/self_attn/k_norm/Mul_1_output_0!/blocks.26/self_attn/k_norm/Mul_1"Mul  */blocks.26/self_attn/k_norm/Mul_1_output_0+/blocks.26/self_attn/k_norm/Cast_2_output_0"/blocks.26/self_attn/k_norm/Cast_2"Cast* to  +/blocks.26/self_attn/q_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0!/blocks.26/self_attn/Mul_output_0/blocks.26/self_attn/Mul"Mul y +/blocks.26/self_attn/q_norm/Cast_2_output_0%/blocks.26/self_attn/Shape_2_output_0/blocks.26/self_attn/Shape_2"Shape (/blocks.26/self_attn/Constant_8_output_0/blocks.26/self_attn/Constant_8"Constant*E value*9B+/blocks.26/self_attn/Constant_8_attr::valueJ  %/blocks.26/self_attn/Shape_2_output_0 (/blocks.26/self_attn/Constant_8_output_0&/blocks.26/self_attn/Gather_2_output_0/blocks.26/self_attn/Gather_2"Gather* axis (/blocks.26/self_attn/Constant_9_output_0/blocks.26/self_attn/Constant_9"Constant*E value*9B+/blocks.26/self_attn/Constant_9_attr::valueJ  &/blocks.26/self_attn/Gather_2_output_0 (/blocks.26/self_attn/Constant_9_output_0!/blocks.26/self_attn/Div_output_0/blocks.26/self_attn/Div"Div s !/blocks.26/self_attn/Div_output_0"/blocks.26/self_attn/Cast_output_0/blocks.26/self_attn/Cast"Cast* to x "/blocks.26/self_attn/Cast_output_0$/blocks.26/self_attn/Cast_1_output_0/blocks.26/self_attn/Cast_1"Cast* to )/blocks.26/self_attn/Constant_10_output_0 /blocks.26/self_attn/Constant_10"Constant*H value*<B,/blocks.26/self_attn/Constant_10_attr::valueJ )/blocks.26/self_attn/Constant_11_output_0 /blocks.26/self_attn/Constant_11"Constant*H value*<B,/blocks.26/self_attn/Constant_11_attr::valueJ )/blocks.26/self_attn/Constant_12_output_0 /blocks.26/self_attn/Constant_12"Constant*H value*<B,/blocks.26/self_attn/Constant_12_attr::valueJ  $/blocks.26/self_attn/Cast_1_output_0 )/blocks.26/self_attn/Constant_12_output_0)/blocks.26/self_attn/Unsqueeze_6_output_0 /blocks.26/self_attn/Unsqueeze_6" Unsqueeze )/blocks.26/self_attn/Constant_13_output_0 /blocks.26/self_attn/Constant_13"Constant*H value*<B,/blocks.26/self_attn/Constant_13_attr::valueJ  +/blocks.26/self_attn/q_norm/Cast_2_output_0 )/blocks.26/self_attn/Constant_11_output_0 )/blocks.26/self_attn/Unsqueeze_6_output_0 )/blocks.26/self_attn/Constant_10_output_0 )/blocks.26/self_attn/Constant_13_output_0#/blocks.26/self_attn/Slice_output_0/blocks.26/self_attn/Slice"Slice )/blocks.26/self_attn/Constant_14_output_0 /blocks.26/self_attn/Constant_14"Constant*H value*<B,/blocks.26/self_attn/Constant_14_attr::valueJ )/blocks.26/self_attn/Constant_15_output_0 /blocks.26/self_attn/Constant_15"Constant*H value*<B,/blocks.26/self_attn/Constant_15_attr::valueJ  $/blocks.26/self_attn/Cast_1_output_0 )/blocks.26/self_attn/Constant_15_output_0)/blocks.26/self_attn/Unsqueeze_7_output_0 /blocks.26/self_attn/Unsqueeze_7" Unsqueeze )/blocks.26/self_attn/Constant_16_output_0 /blocks.26/self_attn/Constant_16"Constant*H value*<B,/blocks.26/self_attn/Constant_16_attr::valueJ )/blocks.26/self_attn/Constant_17_output_0 /blocks.26/self_attn/Constant_17"Constant*H value*<B,/blocks.26/self_attn/Constant_17_attr::valueJ  +/blocks.26/self_attn/q_norm/Cast_2_output_0 )/blocks.26/self_attn/Unsqueeze_7_output_0 )/blocks.26/self_attn/Constant_16_output_0 )/blocks.26/self_attn/Constant_14_output_0 )/blocks.26/self_attn/Constant_17_output_0%/blocks.26/self_attn/Slice_1_output_0/blocks.26/self_attn/Slice_1"Slice i %/blocks.26/self_attn/Slice_1_output_0!/blocks.26/self_attn/Neg_output_0/blocks.26/self_attn/Neg"Neg  !/blocks.26/self_attn/Neg_output_0 #/blocks.26/self_attn/Slice_output_0&/blocks.26/self_attn/Concat_3_output_0/blocks.26/self_attn/Concat_3"Concat* axis  &/blocks.26/self_attn/Concat_3_output_0 %/blocks.0/self_attn/Gather_3_output_0#/blocks.26/self_attn/Mul_1_output_0/blocks.26/self_attn/Mul_1"Mul  !/blocks.26/self_attn/Mul_output_0 #/blocks.26/self_attn/Mul_1_output_0!/blocks.26/self_attn/Add_output_0/blocks.26/self_attn/Add"Add  +/blocks.26/self_attn/k_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0#/blocks.26/self_attn/Mul_2_output_0/blocks.26/self_attn/Mul_2"Mul y +/blocks.26/self_attn/k_norm/Cast_2_output_0%/blocks.26/self_attn/Shape_3_output_0/blocks.26/self_attn/Shape_3"Shape )/blocks.26/self_attn/Constant_18_output_0 /blocks.26/self_attn/Constant_18"Constant*F value*:B,/blocks.26/self_attn/Constant_18_attr::valueJ  %/blocks.26/self_attn/Shape_3_output_0 )/blocks.26/self_attn/Constant_18_output_0&/blocks.26/self_attn/Gather_3_output_0/blocks.26/self_attn/Gather_3"Gather* axis )/blocks.26/self_attn/Constant_19_output_0 /blocks.26/self_attn/Constant_19"Constant*F value*:B,/blocks.26/self_attn/Constant_19_attr::valueJ  &/blocks.26/self_attn/Gather_3_output_0 )/blocks.26/self_attn/Constant_19_output_0#/blocks.26/self_attn/Div_1_output_0/blocks.26/self_attn/Div_1"Div y #/blocks.26/self_attn/Div_1_output_0$/blocks.26/self_attn/Cast_2_output_0/blocks.26/self_attn/Cast_2"Cast* to z $/blocks.26/self_attn/Cast_2_output_0$/blocks.26/self_attn/Cast_3_output_0/blocks.26/self_attn/Cast_3"Cast* to )/blocks.26/self_attn/Constant_20_output_0 /blocks.26/self_attn/Constant_20"Constant*H value*<B,/blocks.26/self_attn/Constant_20_attr::valueJ )/blocks.26/self_attn/Constant_21_output_0 /blocks.26/self_attn/Constant_21"Constant*H value*<B,/blocks.26/self_attn/Constant_21_attr::valueJ )/blocks.26/self_attn/Constant_22_output_0 /blocks.26/self_attn/Constant_22"Constant*H value*<B,/blocks.26/self_attn/Constant_22_attr::valueJ  $/blocks.26/self_attn/Cast_3_output_0 )/blocks.26/self_attn/Constant_22_output_0)/blocks.26/self_attn/Unsqueeze_8_output_0 /blocks.26/self_attn/Unsqueeze_8" Unsqueeze )/blocks.26/self_attn/Constant_23_output_0 /blocks.26/self_attn/Constant_23"Constant*H value*<B,/blocks.26/self_attn/Constant_23_attr::valueJ  +/blocks.26/self_attn/k_norm/Cast_2_output_0 )/blocks.26/self_attn/Constant_21_output_0 )/blocks.26/self_attn/Unsqueeze_8_output_0 )/blocks.26/self_attn/Constant_20_output_0 )/blocks.26/self_attn/Constant_23_output_0%/blocks.26/self_attn/Slice_2_output_0/blocks.26/self_attn/Slice_2"Slice )/blocks.26/self_attn/Constant_24_output_0 /blocks.26/self_attn/Constant_24"Constant*H value*<B,/blocks.26/self_attn/Constant_24_attr::valueJ )/blocks.26/self_attn/Constant_25_output_0 /blocks.26/self_attn/Constant_25"Constant*H value*<B,/blocks.26/self_attn/Constant_25_attr::valueJ  $/blocks.26/self_attn/Cast_3_output_0 )/blocks.26/self_attn/Constant_25_output_0)/blocks.26/self_attn/Unsqueeze_9_output_0 /blocks.26/self_attn/Unsqueeze_9" Unsqueeze )/blocks.26/self_attn/Constant_26_output_0 /blocks.26/self_attn/Constant_26"Constant*H value*<B,/blocks.26/self_attn/Constant_26_attr::valueJ )/blocks.26/self_attn/Constant_27_output_0 /blocks.26/self_attn/Constant_27"Constant*H value*<B,/blocks.26/self_attn/Constant_27_attr::valueJ  +/blocks.26/self_attn/k_norm/Cast_2_output_0 )/blocks.26/self_attn/Unsqueeze_9_output_0 )/blocks.26/self_attn/Constant_26_output_0 )/blocks.26/self_attn/Constant_24_output_0 )/blocks.26/self_attn/Constant_27_output_0%/blocks.26/self_attn/Slice_3_output_0/blocks.26/self_attn/Slice_3"Slice m %/blocks.26/self_attn/Slice_3_output_0#/blocks.26/self_attn/Neg_1_output_0/blocks.26/self_attn/Neg_1"Neg  #/blocks.26/self_attn/Neg_1_output_0 %/blocks.26/self_attn/Slice_2_output_0&/blocks.26/self_attn/Concat_4_output_0/blocks.26/self_attn/Concat_4"Concat* axis  &/blocks.26/self_attn/Concat_4_output_0 %/blocks.0/self_attn/Gather_3_output_0#/blocks.26/self_attn/Mul_3_output_0/blocks.26/self_attn/Mul_3"Mul  #/blocks.26/self_attn/Mul_2_output_0 #/blocks.26/self_attn/Mul_3_output_0#/blocks.26/self_attn/Add_1_output_0/blocks.26/self_attn/Add_1"Add  /Gather_26_output_0 /rotary/Constant_3_output_0&/blocks.26/self_attn/Gather_4_output_0/blocks.26/self_attn/Gather_4"Gather* axis  /Gather_26_output_0 /rotary/Constant_8_output_0&/blocks.26/self_attn/Gather_5_output_0/blocks.26/self_attn/Gather_5"Gather* axis  &/blocks.26/self_attn/Gather_4_output_0 #/blocks.26/self_attn/Add_1_output_0&/blocks.26/self_attn/Concat_5_output_0/blocks.26/self_attn/Concat_5"Concat* axis  &/blocks.26/self_attn/Gather_5_output_0 '/blocks.26/self_attn/Reshape_2_output_0&/blocks.26/self_attn/Concat_6_output_0/blocks.26/self_attn/Concat_6"Concat* axis )/blocks.26/self_attn/Constant_28_output_0 /blocks.26/self_attn/Constant_28"Constant*H value*<B,/blocks.26/self_attn/Constant_28_attr::valueJ  &/blocks.26/self_attn/Concat_5_output_0 )/blocks.26/self_attn/Constant_28_output_0*/blocks.26/self_attn/Unsqueeze_10_output_0!/blocks.26/self_attn/Unsqueeze_10" Unsqueeze )/blocks.26/self_attn/Constant_29_output_0 /blocks.26/self_attn/Constant_29"Constant*H value*<B,/blocks.26/self_attn/Constant_29_attr::valueJ  &/blocks.26/self_attn/Concat_6_output_0 )/blocks.26/self_attn/Constant_29_output_0*/blocks.26/self_attn/Unsqueeze_11_output_0!/blocks.26/self_attn/Unsqueeze_11" Unsqueeze  */blocks.26/self_attn/Unsqueeze_10_output_0 */blocks.26/self_attn/Unsqueeze_11_output_0&/blocks.26/self_attn/Concat_7_output_0/blocks.26/self_attn/Concat_7"Concat* axis  !/blocks.26/self_attn/Add_output_0'/blocks.26/self_attn/Transpose_output_0/blocks.26/self_attn/Transpose" Transpose* perm@@@@  &/blocks.26/self_attn/Concat_5_output_0)/blocks.26/self_attn/Transpose_1_output_0 /blocks.26/self_attn/Transpose_1" Transpose* perm@@@@  &/blocks.26/self_attn/Concat_6_output_0)/blocks.26/self_attn/Transpose_2_output_0 /blocks.26/self_attn/Transpose_2" Transpose* perm@@@@ w )/blocks.26/self_attn/Transpose_1_output_0%/blocks.26/self_attn/Shape_4_output_0/blocks.26/self_attn/Shape_4"Shape )/blocks.26/self_attn/Constant_30_output_0 /blocks.26/self_attn/Constant_30"Constant*F value*:B,/blocks.26/self_attn/Constant_30_attr::valueJ  %/blocks.26/self_attn/Shape_4_output_0 )/blocks.26/self_attn/Constant_30_output_0&/blocks.26/self_attn/Gather_6_output_0/blocks.26/self_attn/Gather_6"Gather* axis w )/blocks.26/self_attn/Transpose_1_output_0%/blocks.26/self_attn/Shape_5_output_0/blocks.26/self_attn/Shape_5"Shape )/blocks.26/self_attn/Constant_31_output_0 /blocks.26/self_attn/Constant_31"Constant*F value*:B,/blocks.26/self_attn/Constant_31_attr::valueJ  %/blocks.26/self_attn/Shape_5_output_0 )/blocks.26/self_attn/Constant_31_output_0&/blocks.26/self_attn/Gather_7_output_0/blocks.26/self_attn/Gather_7"Gather* axis w )/blocks.26/self_attn/Transpose_1_output_0%/blocks.26/self_attn/Shape_6_output_0/blocks.26/self_attn/Shape_6"Shape )/blocks.26/self_attn/Constant_32_output_0 /blocks.26/self_attn/Constant_32"Constant*F value*:B,/blocks.26/self_attn/Constant_32_attr::valueJ  %/blocks.26/self_attn/Shape_6_output_0 )/blocks.26/self_attn/Constant_32_output_0&/blocks.26/self_attn/Gather_8_output_0/blocks.26/self_attn/Gather_8"Gather* axis w )/blocks.26/self_attn/Transpose_1_output_0%/blocks.26/self_attn/Shape_7_output_0/blocks.26/self_attn/Shape_7"Shape )/blocks.26/self_attn/Constant_33_output_0 /blocks.26/self_attn/Constant_33"Constant*F value*:B,/blocks.26/self_attn/Constant_33_attr::valueJ  %/blocks.26/self_attn/Shape_7_output_0 )/blocks.26/self_attn/Constant_33_output_0&/blocks.26/self_attn/Gather_9_output_0/blocks.26/self_attn/Gather_9"Gather* axis )/blocks.26/self_attn/Constant_34_output_0 /blocks.26/self_attn/Constant_34"Constant*H value*<B,/blocks.26/self_attn/Constant_34_attr::valueJ  )/blocks.26/self_attn/Transpose_1_output_0 )/blocks.26/self_attn/Constant_34_output_0*/blocks.26/self_attn/Unsqueeze_12_output_0!/blocks.26/self_attn/Unsqueeze_12" Unsqueeze )/blocks.26/self_attn/Constant_35_output_0 /blocks.26/self_attn/Constant_35"Constant*H value*<B,/blocks.26/self_attn/Constant_35_attr::valueJ  &/blocks.26/self_attn/Gather_6_output_0 )/blocks.26/self_attn/Constant_35_output_0*/blocks.26/self_attn/Unsqueeze_13_output_0!/blocks.26/self_attn/Unsqueeze_13" Unsqueeze )/blocks.26/self_attn/Constant_36_output_0 /blocks.26/self_attn/Constant_36"Constant*H value*<B,/blocks.26/self_attn/Constant_36_attr::valueJ  &/blocks.26/self_attn/Gather_7_output_0 )/blocks.26/self_attn/Constant_36_output_0*/blocks.26/self_attn/Unsqueeze_14_output_0!/blocks.26/self_attn/Unsqueeze_14" Unsqueeze )/blocks.26/self_attn/Constant_37_output_0 /blocks.26/self_attn/Constant_37"Constant*H value*<B,/blocks.26/self_attn/Constant_37_attr::valueJ )/blocks.26/self_attn/Constant_38_output_0 /blocks.26/self_attn/Constant_38"Constant*H value*<B,/blocks.26/self_attn/Constant_38_attr::valueJ  &/blocks.26/self_attn/Gather_8_output_0 )/blocks.26/self_attn/Constant_38_output_0*/blocks.26/self_attn/Unsqueeze_15_output_0!/blocks.26/self_attn/Unsqueeze_15" Unsqueeze )/blocks.26/self_attn/Constant_39_output_0 /blocks.26/self_attn/Constant_39"Constant*H value*<B,/blocks.26/self_attn/Constant_39_attr::valueJ  &/blocks.26/self_attn/Gather_9_output_0 )/blocks.26/self_attn/Constant_39_output_0*/blocks.26/self_attn/Unsqueeze_16_output_0!/blocks.26/self_attn/Unsqueeze_16" Unsqueeze  */blocks.26/self_attn/Unsqueeze_13_output_0 */blocks.26/self_attn/Unsqueeze_14_output_0 )/blocks.26/self_attn/Constant_37_output_0 */blocks.26/self_attn/Unsqueeze_15_output_0 */blocks.26/self_attn/Unsqueeze_16_output_0&/blocks.26/self_attn/Concat_8_output_0/blocks.26/self_attn/Concat_8"Concat* axis )/blocks.26/self_attn/Constant_40_output_0 /blocks.26/self_attn/Constant_40"Constant*H value*<B,/blocks.26/self_attn/Constant_40_attr::valueJ  &/blocks.26/self_attn/Concat_8_output_0 )/blocks.26/self_attn/Constant_40_output_0'/blocks.26/self_attn/Reshape_3_output_0/blocks.26/self_attn/Reshape_3"Reshape* allowzero u '/blocks.26/self_attn/Reshape_3_output_0%/blocks.26/self_attn/Shape_8_output_0/blocks.26/self_attn/Shape_8"Shape  %/blocks.26/self_attn/Shape_8_output_0-/blocks.26/self_attn/ConstantOfShape_output_0$/blocks.26/self_attn/ConstantOfShape"ConstantOfShape*L value*@B0/blocks.26/self_attn/ConstantOfShape_attr::valueJ )/blocks.26/self_attn/Constant_41_output_0 /blocks.26/self_attn/Constant_41"Constant*F value*:B,/blocks.26/self_attn/Constant_41_attr::valueJ  -/blocks.26/self_attn/ConstantOfShape_output_0 )/blocks.26/self_attn/Constant_41_output_0#/blocks.26/self_attn/Mul_4_output_0/blocks.26/self_attn/Mul_4"Mul  '/blocks.26/self_attn/Reshape_3_output_0 #/blocks.26/self_attn/Mul_4_output_0#/blocks.26/self_attn/Equal_output_0/blocks.26/self_attn/Equal"Equal  #/blocks.26/self_attn/Equal_output_0 -/blocks.26/self_attn/ConstantOfShape_output_0 '/blocks.26/self_attn/Reshape_3_output_0#/blocks.26/self_attn/Where_output_0/blocks.26/self_attn/Where"Where  */blocks.26/self_attn/Unsqueeze_12_output_0 #/blocks.26/self_attn/Where_output_0$/blocks.26/self_attn/Expand_output_0/blocks.26/self_attn/Expand"Expand )/blocks.26/self_attn/Constant_42_output_0 /blocks.26/self_attn/Constant_42"Constant*F value*:B,/blocks.26/self_attn/Constant_42_attr::valueJ  &/blocks.26/self_attn/Gather_7_output_0 )/blocks.26/self_attn/Constant_42_output_0#/blocks.26/self_attn/Mul_5_output_0/blocks.26/self_attn/Mul_5"Mul fonnx::Unsqueeze_8097 Constant_9532"Constant*5 value*)BConstant_9532_attr::valueJ  &/blocks.26/self_attn/Gather_6_output_0 onnx::Unsqueeze_8097*/blocks.26/self_attn/Unsqueeze_17_output_0!/blocks.26/self_attn/Unsqueeze_17" Unsqueeze fonnx::Unsqueeze_8099 Constant_9534"Constant*5 value*)BConstant_9534_attr::valueJ  #/blocks.26/self_attn/Mul_5_output_0 onnx::Unsqueeze_8099*/blocks.26/self_attn/Unsqueeze_18_output_0!/blocks.26/self_attn/Unsqueeze_18" Unsqueeze fonnx::Unsqueeze_8101 Constant_9536"Constant*5 value*)BConstant_9536_attr::valueJ  &/blocks.26/self_attn/Gather_8_output_0 onnx::Unsqueeze_8101*/blocks.26/self_attn/Unsqueeze_19_output_0!/blocks.26/self_attn/Unsqueeze_19" Unsqueeze fonnx::Unsqueeze_8103 Constant_9538"Constant*5 value*)BConstant_9538_attr::valueJ  &/blocks.26/self_attn/Gather_9_output_0 onnx::Unsqueeze_8103*/blocks.26/self_attn/Unsqueeze_20_output_0!/blocks.26/self_attn/Unsqueeze_20" Unsqueeze  */blocks.26/self_attn/Unsqueeze_17_output_0 */blocks.26/self_attn/Unsqueeze_18_output_0 */blocks.26/self_attn/Unsqueeze_19_output_0 */blocks.26/self_attn/Unsqueeze_20_output_0&/blocks.26/self_attn/Concat_9_output_0/blocks.26/self_attn/Concat_9"Concat* axis  $/blocks.26/self_attn/Expand_output_0 &/blocks.26/self_attn/Concat_9_output_0'/blocks.26/self_attn/Reshape_4_output_0/blocks.26/self_attn/Reshape_4"Reshape* allowzero w )/blocks.26/self_attn/Transpose_2_output_0%/blocks.26/self_attn/Shape_9_output_0/blocks.26/self_attn/Shape_9"Shape )/blocks.26/self_attn/Constant_43_output_0 /blocks.26/self_attn/Constant_43"Constant*F value*:B,/blocks.26/self_attn/Constant_43_attr::valueJ  %/blocks.26/self_attn/Shape_9_output_0 )/blocks.26/self_attn/Constant_43_output_0'/blocks.26/self_attn/Gather_10_output_0/blocks.26/self_attn/Gather_10"Gather* axis y )/blocks.26/self_attn/Transpose_2_output_0&/blocks.26/self_attn/Shape_10_output_0/blocks.26/self_attn/Shape_10"Shape )/blocks.26/self_attn/Constant_44_output_0 /blocks.26/self_attn/Constant_44"Constant*F value*:B,/blocks.26/self_attn/Constant_44_attr::valueJ  &/blocks.26/self_attn/Shape_10_output_0 )/blocks.26/self_attn/Constant_44_output_0'/blocks.26/self_attn/Gather_11_output_0/blocks.26/self_attn/Gather_11"Gather* axis y )/blocks.26/self_attn/Transpose_2_output_0&/blocks.26/self_attn/Shape_11_output_0/blocks.26/self_attn/Shape_11"Shape )/blocks.26/self_attn/Constant_45_output_0 /blocks.26/self_attn/Constant_45"Constant*F value*:B,/blocks.26/self_attn/Constant_45_attr::valueJ  &/blocks.26/self_attn/Shape_11_output_0 )/blocks.26/self_attn/Constant_45_output_0'/blocks.26/self_attn/Gather_12_output_0/blocks.26/self_attn/Gather_12"Gather* axis y )/blocks.26/self_attn/Transpose_2_output_0&/blocks.26/self_attn/Shape_12_output_0/blocks.26/self_attn/Shape_12"Shape )/blocks.26/self_attn/Constant_46_output_0 /blocks.26/self_attn/Constant_46"Constant*F value*:B,/blocks.26/self_attn/Constant_46_attr::valueJ  &/blocks.26/self_attn/Shape_12_output_0 )/blocks.26/self_attn/Constant_46_output_0'/blocks.26/self_attn/Gather_13_output_0/blocks.26/self_attn/Gather_13"Gather* axis )/blocks.26/self_attn/Constant_47_output_0 /blocks.26/self_attn/Constant_47"Constant*H value*<B,/blocks.26/self_attn/Constant_47_attr::valueJ  )/blocks.26/self_attn/Transpose_2_output_0 )/blocks.26/self_attn/Constant_47_output_0*/blocks.26/self_attn/Unsqueeze_21_output_0!/blocks.26/self_attn/Unsqueeze_21" Unsqueeze )/blocks.26/self_attn/Constant_48_output_0 /blocks.26/self_attn/Constant_48"Constant*H value*<B,/blocks.26/self_attn/Constant_48_attr::valueJ  '/blocks.26/self_attn/Gather_10_output_0 )/blocks.26/self_attn/Constant_48_output_0*/blocks.26/self_attn/Unsqueeze_22_output_0!/blocks.26/self_attn/Unsqueeze_22" Unsqueeze )/blocks.26/self_attn/Constant_49_output_0 /blocks.26/self_attn/Constant_49"Constant*H value*<B,/blocks.26/self_attn/Constant_49_attr::valueJ  '/blocks.26/self_attn/Gather_11_output_0 )/blocks.26/self_attn/Constant_49_output_0*/blocks.26/self_attn/Unsqueeze_23_output_0!/blocks.26/self_attn/Unsqueeze_23" Unsqueeze )/blocks.26/self_attn/Constant_50_output_0 /blocks.26/self_attn/Constant_50"Constant*H value*<B,/blocks.26/self_attn/Constant_50_attr::valueJ )/blocks.26/self_attn/Constant_51_output_0 /blocks.26/self_attn/Constant_51"Constant*H value*<B,/blocks.26/self_attn/Constant_51_attr::valueJ  '/blocks.26/self_attn/Gather_12_output_0 )/blocks.26/self_attn/Constant_51_output_0*/blocks.26/self_attn/Unsqueeze_24_output_0!/blocks.26/self_attn/Unsqueeze_24" Unsqueeze )/blocks.26/self_attn/Constant_52_output_0 /blocks.26/self_attn/Constant_52"Constant*H value*<B,/blocks.26/self_attn/Constant_52_attr::valueJ  '/blocks.26/self_attn/Gather_13_output_0 )/blocks.26/self_attn/Constant_52_output_0*/blocks.26/self_attn/Unsqueeze_25_output_0!/blocks.26/self_attn/Unsqueeze_25" Unsqueeze  */blocks.26/self_attn/Unsqueeze_22_output_0 */blocks.26/self_attn/Unsqueeze_23_output_0 )/blocks.26/self_attn/Constant_50_output_0 */blocks.26/self_attn/Unsqueeze_24_output_0 */blocks.26/self_attn/Unsqueeze_25_output_0'/blocks.26/self_attn/Concat_10_output_0/blocks.26/self_attn/Concat_10"Concat* axis )/blocks.26/self_attn/Constant_53_output_0 /blocks.26/self_attn/Constant_53"Constant*H value*<B,/blocks.26/self_attn/Constant_53_attr::valueJ  '/blocks.26/self_attn/Concat_10_output_0 )/blocks.26/self_attn/Constant_53_output_0'/blocks.26/self_attn/Reshape_5_output_0/blocks.26/self_attn/Reshape_5"Reshape* allowzero w '/blocks.26/self_attn/Reshape_5_output_0&/blocks.26/self_attn/Shape_13_output_0/blocks.26/self_attn/Shape_13"Shape  &/blocks.26/self_attn/Shape_13_output_0//blocks.26/self_attn/ConstantOfShape_1_output_0&/blocks.26/self_attn/ConstantOfShape_1"ConstantOfShape*N value*BB2/blocks.26/self_attn/ConstantOfShape_1_attr::valueJ )/blocks.26/self_attn/Constant_54_output_0 /blocks.26/self_attn/Constant_54"Constant*F value*:B,/blocks.26/self_attn/Constant_54_attr::valueJ  //blocks.26/self_attn/ConstantOfShape_1_output_0 )/blocks.26/self_attn/Constant_54_output_0#/blocks.26/self_attn/Mul_6_output_0/blocks.26/self_attn/Mul_6"Mul  '/blocks.26/self_attn/Reshape_5_output_0 #/blocks.26/self_attn/Mul_6_output_0%/blocks.26/self_attn/Equal_1_output_0/blocks.26/self_attn/Equal_1"Equal  %/blocks.26/self_attn/Equal_1_output_0 //blocks.26/self_attn/ConstantOfShape_1_output_0 '/blocks.26/self_attn/Reshape_5_output_0%/blocks.26/self_attn/Where_1_output_0/blocks.26/self_attn/Where_1"Where  */blocks.26/self_attn/Unsqueeze_21_output_0 %/blocks.26/self_attn/Where_1_output_0&/blocks.26/self_attn/Expand_1_output_0/blocks.26/self_attn/Expand_1"Expand )/blocks.26/self_attn/Constant_55_output_0 /blocks.26/self_attn/Constant_55"Constant*F value*:B,/blocks.26/self_attn/Constant_55_attr::valueJ  '/blocks.26/self_attn/Gather_11_output_0 )/blocks.26/self_attn/Constant_55_output_0#/blocks.26/self_attn/Mul_7_output_0/blocks.26/self_attn/Mul_7"Mul fonnx::Unsqueeze_8143 Constant_9577"Constant*5 value*)BConstant_9577_attr::valueJ  '/blocks.26/self_attn/Gather_10_output_0 onnx::Unsqueeze_8143*/blocks.26/self_attn/Unsqueeze_26_output_0!/blocks.26/self_attn/Unsqueeze_26" Unsqueeze fonnx::Unsqueeze_8145 Constant_9579"Constant*5 value*)BConstant_9579_attr::valueJ  #/blocks.26/self_attn/Mul_7_output_0 onnx::Unsqueeze_8145*/blocks.26/self_attn/Unsqueeze_27_output_0!/blocks.26/self_attn/Unsqueeze_27" Unsqueeze fonnx::Unsqueeze_8147 Constant_9581"Constant*5 value*)BConstant_9581_attr::valueJ  '/blocks.26/self_attn/Gather_12_output_0 onnx::Unsqueeze_8147*/blocks.26/self_attn/Unsqueeze_28_output_0!/blocks.26/self_attn/Unsqueeze_28" Unsqueeze fonnx::Unsqueeze_8149 Constant_9583"Constant*5 value*)BConstant_9583_attr::valueJ  '/blocks.26/self_attn/Gather_13_output_0 onnx::Unsqueeze_8149*/blocks.26/self_attn/Unsqueeze_29_output_0!/blocks.26/self_attn/Unsqueeze_29" Unsqueeze  */blocks.26/self_attn/Unsqueeze_26_output_0 */blocks.26/self_attn/Unsqueeze_27_output_0 */blocks.26/self_attn/Unsqueeze_28_output_0 */blocks.26/self_attn/Unsqueeze_29_output_0'/blocks.26/self_attn/Concat_11_output_0/blocks.26/self_attn/Concat_11"Concat* axis  &/blocks.26/self_attn/Expand_1_output_0 '/blocks.26/self_attn/Concat_11_output_0'/blocks.26/self_attn/Reshape_6_output_0/blocks.26/self_attn/Reshape_6"Reshape* allowzero  '/blocks.26/self_attn/Transpose_output_0 '/blocks.26/self_attn/Reshape_4_output_0$/blocks.26/self_attn/MatMul_output_0/blocks.26/self_attn/MatMul"MatMul )/blocks.26/self_attn/Constant_56_output_0 /blocks.26/self_attn/Constant_56"Constant*B value*6B,/blocks.26/self_attn/Constant_56_attr::valueJ5A  $/blocks.26/self_attn/MatMul_output_0 )/blocks.26/self_attn/Constant_56_output_0#/blocks.26/self_attn/Div_2_output_0/blocks.26/self_attn/Div_2"Div { #/blocks.26/self_attn/Div_2_output_0 attention_mask#/blocks.26/self_attn/Add_2_output_0/blocks.26/self_attn/Add_2"Add  #/blocks.26/self_attn/Add_2_output_0%/blocks.26/self_attn/Softmax_output_0/blocks.26/self_attn/Softmax"Softmax* axis { %/blocks.26/self_attn/Softmax_output_0$/blocks.26/self_attn/Cast_4_output_0/blocks.26/self_attn/Cast_4"Cast* to  $/blocks.26/self_attn/Cast_4_output_0 '/blocks.26/self_attn/Reshape_6_output_0&/blocks.26/self_attn/MatMul_1_output_0/blocks.26/self_attn/MatMul_1"MatMul  &/blocks.26/self_attn/MatMul_1_output_0)/blocks.26/self_attn/Transpose_3_output_0 /blocks.26/self_attn/Transpose_3" Transpose* perm@@@@ fonnx::Unsqueeze_8161 Constant_9595"Constant*5 value*)BConstant_9595_attr::valueJ  $/blocks.26/self_attn/Gather_output_0 onnx::Unsqueeze_8161*/blocks.26/self_attn/Unsqueeze_30_output_0!/blocks.26/self_attn/Unsqueeze_30" Unsqueeze fonnx::Unsqueeze_8163 Constant_9597"Constant*5 value*)BConstant_9597_attr::valueJ  &/blocks.26/self_attn/Gather_1_output_0 onnx::Unsqueeze_8163*/blocks.26/self_attn/Unsqueeze_31_output_0!/blocks.26/self_attn/Unsqueeze_31" Unsqueeze )/blocks.26/self_attn/Constant_57_output_0 /blocks.26/self_attn/Constant_57"Constant*H value*<B,/blocks.26/self_attn/Constant_57_attr::valueJ  */blocks.26/self_attn/Unsqueeze_30_output_0 */blocks.26/self_attn/Unsqueeze_31_output_0 )/blocks.26/self_attn/Constant_57_output_0'/blocks.26/self_attn/Concat_12_output_0/blocks.26/self_attn/Concat_12"Concat* axis  )/blocks.26/self_attn/Transpose_3_output_0 '/blocks.26/self_attn/Concat_12_output_0'/blocks.26/self_attn/Reshape_7_output_0/blocks.26/self_attn/Reshape_7"Reshape* allowzero  '/blocks.26/self_attn/Reshape_7_output_0 onnx::MatMul_9317+/blocks.26/self_attn/o_proj/MatMul_output_0"/blocks.26/self_attn/o_proj/MatMul"MatMul  */blocks.26/input_layernorm/Cast_1_output_0 +/blocks.26/self_attn/o_proj/MatMul_output_0/blocks.26/Add_output_0/blocks.26/Add"Add  /blocks.26/Add_output_01/blocks.26/post_attention_layernorm/Cast_output_0(/blocks.26/post_attention_layernorm/Cast"Cast* to 5/blocks.26/post_attention_layernorm/Constant_output_0,/blocks.26/post_attention_layernorm/Constant"Constant*N value*BB8/blocks.26/post_attention_layernorm/Constant_attr::valueJ@  1/blocks.26/post_attention_layernorm/Cast_output_0 5/blocks.26/post_attention_layernorm/Constant_output_00/blocks.26/post_attention_layernorm/Pow_output_0'/blocks.26/post_attention_layernorm/Pow"Pow  0/blocks.26/post_attention_layernorm/Pow_output_07/blocks.26/post_attention_layernorm/ReduceMean_output_0./blocks.26/post_attention_layernorm/ReduceMean" ReduceMean* axes@* keepdims 7/blocks.26/post_attention_layernorm/Constant_1_output_0./blocks.26/post_attention_layernorm/Constant_1"Constant*P value*DB:/blocks.26/post_attention_layernorm/Constant_1_attr::valueJ75  7/blocks.26/post_attention_layernorm/ReduceMean_output_0 7/blocks.26/post_attention_layernorm/Constant_1_output_00/blocks.26/post_attention_layernorm/Add_output_0'/blocks.26/post_attention_layernorm/Add"Add  0/blocks.26/post_attention_layernorm/Add_output_01/blocks.26/post_attention_layernorm/Sqrt_output_0(/blocks.26/post_attention_layernorm/Sqrt"Sqrt 7/blocks.26/post_attention_layernorm/Constant_2_output_0./blocks.26/post_attention_layernorm/Constant_2"Constant*P value*DB:/blocks.26/post_attention_layernorm/Constant_2_attr::valueJ?  7/blocks.26/post_attention_layernorm/Constant_2_output_0 1/blocks.26/post_attention_layernorm/Sqrt_output_00/blocks.26/post_attention_layernorm/Div_output_0'/blocks.26/post_attention_layernorm/Div"Div  1/blocks.26/post_attention_layernorm/Cast_output_03/blocks.26/post_attention_layernorm/Cast_1_output_0*/blocks.26/post_attention_layernorm/Cast_1"Cast* to  3/blocks.26/post_attention_layernorm/Cast_1_output_0 0/blocks.26/post_attention_layernorm/Div_output_00/blocks.26/post_attention_layernorm/Mul_output_0'/blocks.26/post_attention_layernorm/Mul"Mul  0/blocks.26/post_attention_layernorm/Mul_output_0 )blocks.26.post_attention_layernorm.weight2/blocks.26/post_attention_layernorm/Mul_1_output_0)/blocks.26/post_attention_layernorm/Mul_1"Mul  2/blocks.26/post_attention_layernorm/Mul_1_output_03/blocks.26/post_attention_layernorm/Cast_2_output_0*/blocks.26/post_attention_layernorm/Cast_2"Cast* to  3/blocks.26/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_9318(/blocks.26/mlp/gate_proj/MatMul_output_0/blocks.26/mlp/gate_proj/MatMul"MatMul z (/blocks.26/mlp/gate_proj/MatMul_output_0&/blocks.26/mlp/act_fn/Sigmoid_output_0/blocks.26/mlp/act_fn/Sigmoid"Sigmoid  (/blocks.26/mlp/gate_proj/MatMul_output_0 &/blocks.26/mlp/act_fn/Sigmoid_output_0"/blocks.26/mlp/act_fn/Mul_output_0/blocks.26/mlp/act_fn/Mul"Mul  3/blocks.26/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_9319&/blocks.26/mlp/up_proj/MatMul_output_0/blocks.26/mlp/up_proj/MatMul"MatMul  "/blocks.26/mlp/act_fn/Mul_output_0 &/blocks.26/mlp/up_proj/MatMul_output_0/blocks.26/mlp/Mul_output_0/blocks.26/mlp/Mul"Mul  /blocks.26/mlp/Mul_output_0 onnx::MatMul_9320(/blocks.26/mlp/down_proj/MatMul_output_0/blocks.26/mlp/down_proj/MatMul"MatMul  3/blocks.26/post_attention_layernorm/Cast_1_output_0 (/blocks.26/mlp/down_proj/MatMul_output_0/blocks.26/Add_1_output_0/blocks.26/Add_1"Add c/Constant_19_output_0 /Constant_19"Constant*2 value*&B/Constant_19_attr::valueJ ^ past_key_values /Constant_19_output_0/Gather_27_output_0 /Gather_27"Gather* axis /blocks.27/Constant_output_0/blocks.27/Constant"Constant*K value*?B/blocks.27/Constant_attr::valueJ  /blocks.26/Add_1_output_0 /blocks.27/Constant_output_0/blocks.27/Reshape_output_0/blocks.27/Reshape"Reshape* allowzero y /blocks.27/Reshape_output_0(/blocks.27/input_layernorm/Cast_output_0/blocks.27/input_layernorm/Cast"Cast* to ,/blocks.27/input_layernorm/Constant_output_0#/blocks.27/input_layernorm/Constant"Constant*E value*9B//blocks.27/input_layernorm/Constant_attr::valueJ@  (/blocks.27/input_layernorm/Cast_output_0 ,/blocks.27/input_layernorm/Constant_output_0'/blocks.27/input_layernorm/Pow_output_0/blocks.27/input_layernorm/Pow"Pow  '/blocks.27/input_layernorm/Pow_output_0./blocks.27/input_layernorm/ReduceMean_output_0%/blocks.27/input_layernorm/ReduceMean" ReduceMean* axes@* keepdims ./blocks.27/input_layernorm/Constant_1_output_0%/blocks.27/input_layernorm/Constant_1"Constant*G value*;B1/blocks.27/input_layernorm/Constant_1_attr::valueJ75  ./blocks.27/input_layernorm/ReduceMean_output_0 ./blocks.27/input_layernorm/Constant_1_output_0'/blocks.27/input_layernorm/Add_output_0/blocks.27/input_layernorm/Add"Add z '/blocks.27/input_layernorm/Add_output_0(/blocks.27/input_layernorm/Sqrt_output_0/blocks.27/input_layernorm/Sqrt"Sqrt ./blocks.27/input_layernorm/Constant_2_output_0%/blocks.27/input_layernorm/Constant_2"Constant*G value*;B1/blocks.27/input_layernorm/Constant_2_attr::valueJ?  ./blocks.27/input_layernorm/Constant_2_output_0 (/blocks.27/input_layernorm/Sqrt_output_0'/blocks.27/input_layernorm/Div_output_0/blocks.27/input_layernorm/Div"Div  (/blocks.27/input_layernorm/Cast_output_0*/blocks.27/input_layernorm/Cast_1_output_0!/blocks.27/input_layernorm/Cast_1"Cast* to  */blocks.27/input_layernorm/Cast_1_output_0 '/blocks.27/input_layernorm/Div_output_0'/blocks.27/input_layernorm/Mul_output_0/blocks.27/input_layernorm/Mul"Mul  '/blocks.27/input_layernorm/Mul_output_0 blocks.27.input_layernorm.weight)/blocks.27/input_layernorm/Mul_1_output_0 /blocks.27/input_layernorm/Mul_1"Mul  )/blocks.27/input_layernorm/Mul_1_output_0*/blocks.27/input_layernorm/Cast_2_output_0!/blocks.27/input_layernorm/Cast_2"Cast* to t */blocks.27/input_layernorm/Cast_2_output_0#/blocks.27/self_attn/Shape_output_0/blocks.27/self_attn/Shape"Shape &/blocks.27/self_attn/Constant_output_0/blocks.27/self_attn/Constant"Constant*C value*7B)/blocks.27/self_attn/Constant_attr::valueJ  #/blocks.27/self_attn/Shape_output_0 &/blocks.27/self_attn/Constant_output_0$/blocks.27/self_attn/Gather_output_0/blocks.27/self_attn/Gather"Gather* axis x */blocks.27/input_layernorm/Cast_2_output_0%/blocks.27/self_attn/Shape_1_output_0/blocks.27/self_attn/Shape_1"Shape (/blocks.27/self_attn/Constant_1_output_0/blocks.27/self_attn/Constant_1"Constant*E value*9B+/blocks.27/self_attn/Constant_1_attr::valueJ  %/blocks.27/self_attn/Shape_1_output_0 (/blocks.27/self_attn/Constant_1_output_0&/blocks.27/self_attn/Gather_1_output_0/blocks.27/self_attn/Gather_1"Gather* axis  */blocks.27/input_layernorm/Cast_2_output_0 onnx::MatMul_9321+/blocks.27/self_attn/q_proj/MatMul_output_0"/blocks.27/self_attn/q_proj/MatMul"MatMul  */blocks.27/input_layernorm/Cast_2_output_0 onnx::MatMul_9322+/blocks.27/self_attn/k_proj/MatMul_output_0"/blocks.27/self_attn/k_proj/MatMul"MatMul  */blocks.27/input_layernorm/Cast_2_output_0 onnx::MatMul_9323+/blocks.27/self_attn/v_proj/MatMul_output_0"/blocks.27/self_attn/v_proj/MatMul"MatMul fonnx::Unsqueeze_8224 Constant_9650"Constant*5 value*)BConstant_9650_attr::valueJ  $/blocks.27/self_attn/Gather_output_0 onnx::Unsqueeze_8224'/blocks.27/self_attn/Unsqueeze_output_0/blocks.27/self_attn/Unsqueeze" Unsqueeze fonnx::Unsqueeze_8226 Constant_9652"Constant*5 value*)BConstant_9652_attr::valueJ  &/blocks.27/self_attn/Gather_1_output_0 onnx::Unsqueeze_8226)/blocks.27/self_attn/Unsqueeze_1_output_0 /blocks.27/self_attn/Unsqueeze_1" Unsqueeze (/blocks.27/self_attn/Constant_2_output_0/blocks.27/self_attn/Constant_2"Constant*G value*;B+/blocks.27/self_attn/Constant_2_attr::valueJ (/blocks.27/self_attn/Constant_3_output_0/blocks.27/self_attn/Constant_3"Constant*G value*;B+/blocks.27/self_attn/Constant_3_attr::valueJ  '/blocks.27/self_attn/Unsqueeze_output_0 )/blocks.27/self_attn/Unsqueeze_1_output_0 (/blocks.27/self_attn/Constant_2_output_0 (/blocks.27/self_attn/Constant_3_output_0$/blocks.27/self_attn/Concat_output_0/blocks.27/self_attn/Concat"Concat* axis  +/blocks.27/self_attn/q_proj/MatMul_output_0 $/blocks.27/self_attn/Concat_output_0%/blocks.27/self_attn/Reshape_output_0/blocks.27/self_attn/Reshape"Reshape* allowzero fonnx::Unsqueeze_8234 Constant_9658"Constant*5 value*)BConstant_9658_attr::valueJ  $/blocks.27/self_attn/Gather_output_0 onnx::Unsqueeze_8234)/blocks.27/self_attn/Unsqueeze_2_output_0 /blocks.27/self_attn/Unsqueeze_2" Unsqueeze fonnx::Unsqueeze_8236 Constant_9660"Constant*5 value*)BConstant_9660_attr::valueJ  &/blocks.27/self_attn/Gather_1_output_0 onnx::Unsqueeze_8236)/blocks.27/self_attn/Unsqueeze_3_output_0 /blocks.27/self_attn/Unsqueeze_3" Unsqueeze (/blocks.27/self_attn/Constant_4_output_0/blocks.27/self_attn/Constant_4"Constant*G value*;B+/blocks.27/self_attn/Constant_4_attr::valueJ (/blocks.27/self_attn/Constant_5_output_0/blocks.27/self_attn/Constant_5"Constant*G value*;B+/blocks.27/self_attn/Constant_5_attr::valueJ  )/blocks.27/self_attn/Unsqueeze_2_output_0 )/blocks.27/self_attn/Unsqueeze_3_output_0 (/blocks.27/self_attn/Constant_4_output_0 (/blocks.27/self_attn/Constant_5_output_0&/blocks.27/self_attn/Concat_1_output_0/blocks.27/self_attn/Concat_1"Concat* axis fonnx::Unsqueeze_8243 Constant_9665"Constant*5 value*)BConstant_9665_attr::valueJ  $/blocks.27/self_attn/Gather_output_0 onnx::Unsqueeze_8243)/blocks.27/self_attn/Unsqueeze_4_output_0 /blocks.27/self_attn/Unsqueeze_4" Unsqueeze fonnx::Unsqueeze_8245 Constant_9667"Constant*5 value*)BConstant_9667_attr::valueJ  &/blocks.27/self_attn/Gather_1_output_0 onnx::Unsqueeze_8245)/blocks.27/self_attn/Unsqueeze_5_output_0 /blocks.27/self_attn/Unsqueeze_5" Unsqueeze (/blocks.27/self_attn/Constant_6_output_0/blocks.27/self_attn/Constant_6"Constant*G value*;B+/blocks.27/self_attn/Constant_6_attr::valueJ (/blocks.27/self_attn/Constant_7_output_0/blocks.27/self_attn/Constant_7"Constant*G value*;B+/blocks.27/self_attn/Constant_7_attr::valueJ  )/blocks.27/self_attn/Unsqueeze_4_output_0 )/blocks.27/self_attn/Unsqueeze_5_output_0 (/blocks.27/self_attn/Constant_6_output_0 (/blocks.27/self_attn/Constant_7_output_0&/blocks.27/self_attn/Concat_2_output_0/blocks.27/self_attn/Concat_2"Concat* axis  +/blocks.27/self_attn/k_proj/MatMul_output_0 &/blocks.27/self_attn/Concat_1_output_0'/blocks.27/self_attn/Reshape_1_output_0/blocks.27/self_attn/Reshape_1"Reshape* allowzero  +/blocks.27/self_attn/v_proj/MatMul_output_0 &/blocks.27/self_attn/Concat_2_output_0'/blocks.27/self_attn/Reshape_2_output_0/blocks.27/self_attn/Reshape_2"Reshape* allowzero  %/blocks.27/self_attn/Reshape_output_0)/blocks.27/self_attn/q_norm/Cast_output_0 /blocks.27/self_attn/q_norm/Cast"Cast* to -/blocks.27/self_attn/q_norm/Constant_output_0$/blocks.27/self_attn/q_norm/Constant"Constant*F value*:B0/blocks.27/self_attn/q_norm/Constant_attr::valueJ@  )/blocks.27/self_attn/q_norm/Cast_output_0 -/blocks.27/self_attn/q_norm/Constant_output_0(/blocks.27/self_attn/q_norm/Pow_output_0/blocks.27/self_attn/q_norm/Pow"Pow  (/blocks.27/self_attn/q_norm/Pow_output_0//blocks.27/self_attn/q_norm/ReduceMean_output_0&/blocks.27/self_attn/q_norm/ReduceMean" ReduceMean* axes@* keepdims //blocks.27/self_attn/q_norm/Constant_1_output_0&/blocks.27/self_attn/q_norm/Constant_1"Constant*H value*<B2/blocks.27/self_attn/q_norm/Constant_1_attr::valueJ75  //blocks.27/self_attn/q_norm/ReduceMean_output_0 //blocks.27/self_attn/q_norm/Constant_1_output_0(/blocks.27/self_attn/q_norm/Add_output_0/blocks.27/self_attn/q_norm/Add"Add } (/blocks.27/self_attn/q_norm/Add_output_0)/blocks.27/self_attn/q_norm/Sqrt_output_0 /blocks.27/self_attn/q_norm/Sqrt"Sqrt //blocks.27/self_attn/q_norm/Constant_2_output_0&/blocks.27/self_attn/q_norm/Constant_2"Constant*H value*<B2/blocks.27/self_attn/q_norm/Constant_2_attr::valueJ?  //blocks.27/self_attn/q_norm/Constant_2_output_0 )/blocks.27/self_attn/q_norm/Sqrt_output_0(/blocks.27/self_attn/q_norm/Div_output_0/blocks.27/self_attn/q_norm/Div"Div  )/blocks.27/self_attn/q_norm/Cast_output_0+/blocks.27/self_attn/q_norm/Cast_1_output_0"/blocks.27/self_attn/q_norm/Cast_1"Cast* to  +/blocks.27/self_attn/q_norm/Cast_1_output_0 (/blocks.27/self_attn/q_norm/Div_output_0(/blocks.27/self_attn/q_norm/Mul_output_0/blocks.27/self_attn/q_norm/Mul"Mul  (/blocks.27/self_attn/q_norm/Mul_output_0 !blocks.27.self_attn.q_norm.weight*/blocks.27/self_attn/q_norm/Mul_1_output_0!/blocks.27/self_attn/q_norm/Mul_1"Mul  */blocks.27/self_attn/q_norm/Mul_1_output_0+/blocks.27/self_attn/q_norm/Cast_2_output_0"/blocks.27/self_attn/q_norm/Cast_2"Cast* to  '/blocks.27/self_attn/Reshape_1_output_0)/blocks.27/self_attn/k_norm/Cast_output_0 /blocks.27/self_attn/k_norm/Cast"Cast* to -/blocks.27/self_attn/k_norm/Constant_output_0$/blocks.27/self_attn/k_norm/Constant"Constant*F value*:B0/blocks.27/self_attn/k_norm/Constant_attr::valueJ@  )/blocks.27/self_attn/k_norm/Cast_output_0 -/blocks.27/self_attn/k_norm/Constant_output_0(/blocks.27/self_attn/k_norm/Pow_output_0/blocks.27/self_attn/k_norm/Pow"Pow  (/blocks.27/self_attn/k_norm/Pow_output_0//blocks.27/self_attn/k_norm/ReduceMean_output_0&/blocks.27/self_attn/k_norm/ReduceMean" ReduceMean* axes@* keepdims //blocks.27/self_attn/k_norm/Constant_1_output_0&/blocks.27/self_attn/k_norm/Constant_1"Constant*H value*<B2/blocks.27/self_attn/k_norm/Constant_1_attr::valueJ75  //blocks.27/self_attn/k_norm/ReduceMean_output_0 //blocks.27/self_attn/k_norm/Constant_1_output_0(/blocks.27/self_attn/k_norm/Add_output_0/blocks.27/self_attn/k_norm/Add"Add } (/blocks.27/self_attn/k_norm/Add_output_0)/blocks.27/self_attn/k_norm/Sqrt_output_0 /blocks.27/self_attn/k_norm/Sqrt"Sqrt //blocks.27/self_attn/k_norm/Constant_2_output_0&/blocks.27/self_attn/k_norm/Constant_2"Constant*H value*<B2/blocks.27/self_attn/k_norm/Constant_2_attr::valueJ?  //blocks.27/self_attn/k_norm/Constant_2_output_0 )/blocks.27/self_attn/k_norm/Sqrt_output_0(/blocks.27/self_attn/k_norm/Div_output_0/blocks.27/self_attn/k_norm/Div"Div  )/blocks.27/self_attn/k_norm/Cast_output_0+/blocks.27/self_attn/k_norm/Cast_1_output_0"/blocks.27/self_attn/k_norm/Cast_1"Cast* to  +/blocks.27/self_attn/k_norm/Cast_1_output_0 (/blocks.27/self_attn/k_norm/Div_output_0(/blocks.27/self_attn/k_norm/Mul_output_0/blocks.27/self_attn/k_norm/Mul"Mul  (/blocks.27/self_attn/k_norm/Mul_output_0 !blocks.27.self_attn.k_norm.weight*/blocks.27/self_attn/k_norm/Mul_1_output_0!/blocks.27/self_attn/k_norm/Mul_1"Mul  */blocks.27/self_attn/k_norm/Mul_1_output_0+/blocks.27/self_attn/k_norm/Cast_2_output_0"/blocks.27/self_attn/k_norm/Cast_2"Cast* to  +/blocks.27/self_attn/q_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0!/blocks.27/self_attn/Mul_output_0/blocks.27/self_attn/Mul"Mul y +/blocks.27/self_attn/q_norm/Cast_2_output_0%/blocks.27/self_attn/Shape_2_output_0/blocks.27/self_attn/Shape_2"Shape (/blocks.27/self_attn/Constant_8_output_0/blocks.27/self_attn/Constant_8"Constant*E value*9B+/blocks.27/self_attn/Constant_8_attr::valueJ  %/blocks.27/self_attn/Shape_2_output_0 (/blocks.27/self_attn/Constant_8_output_0&/blocks.27/self_attn/Gather_2_output_0/blocks.27/self_attn/Gather_2"Gather* axis (/blocks.27/self_attn/Constant_9_output_0/blocks.27/self_attn/Constant_9"Constant*E value*9B+/blocks.27/self_attn/Constant_9_attr::valueJ  &/blocks.27/self_attn/Gather_2_output_0 (/blocks.27/self_attn/Constant_9_output_0!/blocks.27/self_attn/Div_output_0/blocks.27/self_attn/Div"Div s !/blocks.27/self_attn/Div_output_0"/blocks.27/self_attn/Cast_output_0/blocks.27/self_attn/Cast"Cast* to x "/blocks.27/self_attn/Cast_output_0$/blocks.27/self_attn/Cast_1_output_0/blocks.27/self_attn/Cast_1"Cast* to )/blocks.27/self_attn/Constant_10_output_0 /blocks.27/self_attn/Constant_10"Constant*H value*<B,/blocks.27/self_attn/Constant_10_attr::valueJ )/blocks.27/self_attn/Constant_11_output_0 /blocks.27/self_attn/Constant_11"Constant*H value*<B,/blocks.27/self_attn/Constant_11_attr::valueJ )/blocks.27/self_attn/Constant_12_output_0 /blocks.27/self_attn/Constant_12"Constant*H value*<B,/blocks.27/self_attn/Constant_12_attr::valueJ  $/blocks.27/self_attn/Cast_1_output_0 )/blocks.27/self_attn/Constant_12_output_0)/blocks.27/self_attn/Unsqueeze_6_output_0 /blocks.27/self_attn/Unsqueeze_6" Unsqueeze )/blocks.27/self_attn/Constant_13_output_0 /blocks.27/self_attn/Constant_13"Constant*H value*<B,/blocks.27/self_attn/Constant_13_attr::valueJ  +/blocks.27/self_attn/q_norm/Cast_2_output_0 )/blocks.27/self_attn/Constant_11_output_0 )/blocks.27/self_attn/Unsqueeze_6_output_0 )/blocks.27/self_attn/Constant_10_output_0 )/blocks.27/self_attn/Constant_13_output_0#/blocks.27/self_attn/Slice_output_0/blocks.27/self_attn/Slice"Slice )/blocks.27/self_attn/Constant_14_output_0 /blocks.27/self_attn/Constant_14"Constant*H value*<B,/blocks.27/self_attn/Constant_14_attr::valueJ )/blocks.27/self_attn/Constant_15_output_0 /blocks.27/self_attn/Constant_15"Constant*H value*<B,/blocks.27/self_attn/Constant_15_attr::valueJ  $/blocks.27/self_attn/Cast_1_output_0 )/blocks.27/self_attn/Constant_15_output_0)/blocks.27/self_attn/Unsqueeze_7_output_0 /blocks.27/self_attn/Unsqueeze_7" Unsqueeze )/blocks.27/self_attn/Constant_16_output_0 /blocks.27/self_attn/Constant_16"Constant*H value*<B,/blocks.27/self_attn/Constant_16_attr::valueJ )/blocks.27/self_attn/Constant_17_output_0 /blocks.27/self_attn/Constant_17"Constant*H value*<B,/blocks.27/self_attn/Constant_17_attr::valueJ  +/blocks.27/self_attn/q_norm/Cast_2_output_0 )/blocks.27/self_attn/Unsqueeze_7_output_0 )/blocks.27/self_attn/Constant_16_output_0 )/blocks.27/self_attn/Constant_14_output_0 )/blocks.27/self_attn/Constant_17_output_0%/blocks.27/self_attn/Slice_1_output_0/blocks.27/self_attn/Slice_1"Slice i %/blocks.27/self_attn/Slice_1_output_0!/blocks.27/self_attn/Neg_output_0/blocks.27/self_attn/Neg"Neg  !/blocks.27/self_attn/Neg_output_0 #/blocks.27/self_attn/Slice_output_0&/blocks.27/self_attn/Concat_3_output_0/blocks.27/self_attn/Concat_3"Concat* axis  &/blocks.27/self_attn/Concat_3_output_0 %/blocks.0/self_attn/Gather_3_output_0#/blocks.27/self_attn/Mul_1_output_0/blocks.27/self_attn/Mul_1"Mul  !/blocks.27/self_attn/Mul_output_0 #/blocks.27/self_attn/Mul_1_output_0!/blocks.27/self_attn/Add_output_0/blocks.27/self_attn/Add"Add  +/blocks.27/self_attn/k_norm/Cast_2_output_0 %/blocks.0/self_attn/Gather_2_output_0#/blocks.27/self_attn/Mul_2_output_0/blocks.27/self_attn/Mul_2"Mul y +/blocks.27/self_attn/k_norm/Cast_2_output_0%/blocks.27/self_attn/Shape_3_output_0/blocks.27/self_attn/Shape_3"Shape )/blocks.27/self_attn/Constant_18_output_0 /blocks.27/self_attn/Constant_18"Constant*F value*:B,/blocks.27/self_attn/Constant_18_attr::valueJ  %/blocks.27/self_attn/Shape_3_output_0 )/blocks.27/self_attn/Constant_18_output_0&/blocks.27/self_attn/Gather_3_output_0/blocks.27/self_attn/Gather_3"Gather* axis )/blocks.27/self_attn/Constant_19_output_0 /blocks.27/self_attn/Constant_19"Constant*F value*:B,/blocks.27/self_attn/Constant_19_attr::valueJ  &/blocks.27/self_attn/Gather_3_output_0 )/blocks.27/self_attn/Constant_19_output_0#/blocks.27/self_attn/Div_1_output_0/blocks.27/self_attn/Div_1"Div y #/blocks.27/self_attn/Div_1_output_0$/blocks.27/self_attn/Cast_2_output_0/blocks.27/self_attn/Cast_2"Cast* to z $/blocks.27/self_attn/Cast_2_output_0$/blocks.27/self_attn/Cast_3_output_0/blocks.27/self_attn/Cast_3"Cast* to )/blocks.27/self_attn/Constant_20_output_0 /blocks.27/self_attn/Constant_20"Constant*H value*<B,/blocks.27/self_attn/Constant_20_attr::valueJ )/blocks.27/self_attn/Constant_21_output_0 /blocks.27/self_attn/Constant_21"Constant*H value*<B,/blocks.27/self_attn/Constant_21_attr::valueJ )/blocks.27/self_attn/Constant_22_output_0 /blocks.27/self_attn/Constant_22"Constant*H value*<B,/blocks.27/self_attn/Constant_22_attr::valueJ  $/blocks.27/self_attn/Cast_3_output_0 )/blocks.27/self_attn/Constant_22_output_0)/blocks.27/self_attn/Unsqueeze_8_output_0 /blocks.27/self_attn/Unsqueeze_8" Unsqueeze )/blocks.27/self_attn/Constant_23_output_0 /blocks.27/self_attn/Constant_23"Constant*H value*<B,/blocks.27/self_attn/Constant_23_attr::valueJ  +/blocks.27/self_attn/k_norm/Cast_2_output_0 )/blocks.27/self_attn/Constant_21_output_0 )/blocks.27/self_attn/Unsqueeze_8_output_0 )/blocks.27/self_attn/Constant_20_output_0 )/blocks.27/self_attn/Constant_23_output_0%/blocks.27/self_attn/Slice_2_output_0/blocks.27/self_attn/Slice_2"Slice )/blocks.27/self_attn/Constant_24_output_0 /blocks.27/self_attn/Constant_24"Constant*H value*<B,/blocks.27/self_attn/Constant_24_attr::valueJ )/blocks.27/self_attn/Constant_25_output_0 /blocks.27/self_attn/Constant_25"Constant*H value*<B,/blocks.27/self_attn/Constant_25_attr::valueJ  $/blocks.27/self_attn/Cast_3_output_0 )/blocks.27/self_attn/Constant_25_output_0)/blocks.27/self_attn/Unsqueeze_9_output_0 /blocks.27/self_attn/Unsqueeze_9" Unsqueeze )/blocks.27/self_attn/Constant_26_output_0 /blocks.27/self_attn/Constant_26"Constant*H value*<B,/blocks.27/self_attn/Constant_26_attr::valueJ )/blocks.27/self_attn/Constant_27_output_0 /blocks.27/self_attn/Constant_27"Constant*H value*<B,/blocks.27/self_attn/Constant_27_attr::valueJ  +/blocks.27/self_attn/k_norm/Cast_2_output_0 )/blocks.27/self_attn/Unsqueeze_9_output_0 )/blocks.27/self_attn/Constant_26_output_0 )/blocks.27/self_attn/Constant_24_output_0 )/blocks.27/self_attn/Constant_27_output_0%/blocks.27/self_attn/Slice_3_output_0/blocks.27/self_attn/Slice_3"Slice m %/blocks.27/self_attn/Slice_3_output_0#/blocks.27/self_attn/Neg_1_output_0/blocks.27/self_attn/Neg_1"Neg  #/blocks.27/self_attn/Neg_1_output_0 %/blocks.27/self_attn/Slice_2_output_0&/blocks.27/self_attn/Concat_4_output_0/blocks.27/self_attn/Concat_4"Concat* axis  &/blocks.27/self_attn/Concat_4_output_0 %/blocks.0/self_attn/Gather_3_output_0#/blocks.27/self_attn/Mul_3_output_0/blocks.27/self_attn/Mul_3"Mul  #/blocks.27/self_attn/Mul_2_output_0 #/blocks.27/self_attn/Mul_3_output_0#/blocks.27/self_attn/Add_1_output_0/blocks.27/self_attn/Add_1"Add  /Gather_27_output_0 /rotary/Constant_3_output_0&/blocks.27/self_attn/Gather_4_output_0/blocks.27/self_attn/Gather_4"Gather* axis  /Gather_27_output_0 /rotary/Constant_8_output_0&/blocks.27/self_attn/Gather_5_output_0/blocks.27/self_attn/Gather_5"Gather* axis  &/blocks.27/self_attn/Gather_4_output_0 #/blocks.27/self_attn/Add_1_output_0&/blocks.27/self_attn/Concat_5_output_0/blocks.27/self_attn/Concat_5"Concat* axis  &/blocks.27/self_attn/Gather_5_output_0 '/blocks.27/self_attn/Reshape_2_output_0&/blocks.27/self_attn/Concat_6_output_0/blocks.27/self_attn/Concat_6"Concat* axis )/blocks.27/self_attn/Constant_28_output_0 /blocks.27/self_attn/Constant_28"Constant*H value*<B,/blocks.27/self_attn/Constant_28_attr::valueJ  &/blocks.27/self_attn/Concat_5_output_0 )/blocks.27/self_attn/Constant_28_output_0*/blocks.27/self_attn/Unsqueeze_10_output_0!/blocks.27/self_attn/Unsqueeze_10" Unsqueeze )/blocks.27/self_attn/Constant_29_output_0 /blocks.27/self_attn/Constant_29"Constant*H value*<B,/blocks.27/self_attn/Constant_29_attr::valueJ  &/blocks.27/self_attn/Concat_6_output_0 )/blocks.27/self_attn/Constant_29_output_0*/blocks.27/self_attn/Unsqueeze_11_output_0!/blocks.27/self_attn/Unsqueeze_11" Unsqueeze  */blocks.27/self_attn/Unsqueeze_10_output_0 */blocks.27/self_attn/Unsqueeze_11_output_0&/blocks.27/self_attn/Concat_7_output_0/blocks.27/self_attn/Concat_7"Concat* axis  !/blocks.27/self_attn/Add_output_0'/blocks.27/self_attn/Transpose_output_0/blocks.27/self_attn/Transpose" Transpose* perm@@@@  &/blocks.27/self_attn/Concat_5_output_0)/blocks.27/self_attn/Transpose_1_output_0 /blocks.27/self_attn/Transpose_1" Transpose* perm@@@@  &/blocks.27/self_attn/Concat_6_output_0)/blocks.27/self_attn/Transpose_2_output_0 /blocks.27/self_attn/Transpose_2" Transpose* perm@@@@ w )/blocks.27/self_attn/Transpose_1_output_0%/blocks.27/self_attn/Shape_4_output_0/blocks.27/self_attn/Shape_4"Shape )/blocks.27/self_attn/Constant_30_output_0 /blocks.27/self_attn/Constant_30"Constant*F value*:B,/blocks.27/self_attn/Constant_30_attr::valueJ  %/blocks.27/self_attn/Shape_4_output_0 )/blocks.27/self_attn/Constant_30_output_0&/blocks.27/self_attn/Gather_6_output_0/blocks.27/self_attn/Gather_6"Gather* axis w )/blocks.27/self_attn/Transpose_1_output_0%/blocks.27/self_attn/Shape_5_output_0/blocks.27/self_attn/Shape_5"Shape )/blocks.27/self_attn/Constant_31_output_0 /blocks.27/self_attn/Constant_31"Constant*F value*:B,/blocks.27/self_attn/Constant_31_attr::valueJ  %/blocks.27/self_attn/Shape_5_output_0 )/blocks.27/self_attn/Constant_31_output_0&/blocks.27/self_attn/Gather_7_output_0/blocks.27/self_attn/Gather_7"Gather* axis w )/blocks.27/self_attn/Transpose_1_output_0%/blocks.27/self_attn/Shape_6_output_0/blocks.27/self_attn/Shape_6"Shape )/blocks.27/self_attn/Constant_32_output_0 /blocks.27/self_attn/Constant_32"Constant*F value*:B,/blocks.27/self_attn/Constant_32_attr::valueJ  %/blocks.27/self_attn/Shape_6_output_0 )/blocks.27/self_attn/Constant_32_output_0&/blocks.27/self_attn/Gather_8_output_0/blocks.27/self_attn/Gather_8"Gather* axis w )/blocks.27/self_attn/Transpose_1_output_0%/blocks.27/self_attn/Shape_7_output_0/blocks.27/self_attn/Shape_7"Shape )/blocks.27/self_attn/Constant_33_output_0 /blocks.27/self_attn/Constant_33"Constant*F value*:B,/blocks.27/self_attn/Constant_33_attr::valueJ  %/blocks.27/self_attn/Shape_7_output_0 )/blocks.27/self_attn/Constant_33_output_0&/blocks.27/self_attn/Gather_9_output_0/blocks.27/self_attn/Gather_9"Gather* axis )/blocks.27/self_attn/Constant_34_output_0 /blocks.27/self_attn/Constant_34"Constant*H value*<B,/blocks.27/self_attn/Constant_34_attr::valueJ  )/blocks.27/self_attn/Transpose_1_output_0 )/blocks.27/self_attn/Constant_34_output_0*/blocks.27/self_attn/Unsqueeze_12_output_0!/blocks.27/self_attn/Unsqueeze_12" Unsqueeze )/blocks.27/self_attn/Constant_35_output_0 /blocks.27/self_attn/Constant_35"Constant*H value*<B,/blocks.27/self_attn/Constant_35_attr::valueJ  &/blocks.27/self_attn/Gather_6_output_0 )/blocks.27/self_attn/Constant_35_output_0*/blocks.27/self_attn/Unsqueeze_13_output_0!/blocks.27/self_attn/Unsqueeze_13" Unsqueeze )/blocks.27/self_attn/Constant_36_output_0 /blocks.27/self_attn/Constant_36"Constant*H value*<B,/blocks.27/self_attn/Constant_36_attr::valueJ  &/blocks.27/self_attn/Gather_7_output_0 )/blocks.27/self_attn/Constant_36_output_0*/blocks.27/self_attn/Unsqueeze_14_output_0!/blocks.27/self_attn/Unsqueeze_14" Unsqueeze )/blocks.27/self_attn/Constant_37_output_0 /blocks.27/self_attn/Constant_37"Constant*H value*<B,/blocks.27/self_attn/Constant_37_attr::valueJ )/blocks.27/self_attn/Constant_38_output_0 /blocks.27/self_attn/Constant_38"Constant*H value*<B,/blocks.27/self_attn/Constant_38_attr::valueJ  &/blocks.27/self_attn/Gather_8_output_0 )/blocks.27/self_attn/Constant_38_output_0*/blocks.27/self_attn/Unsqueeze_15_output_0!/blocks.27/self_attn/Unsqueeze_15" Unsqueeze )/blocks.27/self_attn/Constant_39_output_0 /blocks.27/self_attn/Constant_39"Constant*H value*<B,/blocks.27/self_attn/Constant_39_attr::valueJ  &/blocks.27/self_attn/Gather_9_output_0 )/blocks.27/self_attn/Constant_39_output_0*/blocks.27/self_attn/Unsqueeze_16_output_0!/blocks.27/self_attn/Unsqueeze_16" Unsqueeze  */blocks.27/self_attn/Unsqueeze_13_output_0 */blocks.27/self_attn/Unsqueeze_14_output_0 )/blocks.27/self_attn/Constant_37_output_0 */blocks.27/self_attn/Unsqueeze_15_output_0 */blocks.27/self_attn/Unsqueeze_16_output_0&/blocks.27/self_attn/Concat_8_output_0/blocks.27/self_attn/Concat_8"Concat* axis )/blocks.27/self_attn/Constant_40_output_0 /blocks.27/self_attn/Constant_40"Constant*H value*<B,/blocks.27/self_attn/Constant_40_attr::valueJ  &/blocks.27/self_attn/Concat_8_output_0 )/blocks.27/self_attn/Constant_40_output_0'/blocks.27/self_attn/Reshape_3_output_0/blocks.27/self_attn/Reshape_3"Reshape* allowzero u '/blocks.27/self_attn/Reshape_3_output_0%/blocks.27/self_attn/Shape_8_output_0/blocks.27/self_attn/Shape_8"Shape  %/blocks.27/self_attn/Shape_8_output_0-/blocks.27/self_attn/ConstantOfShape_output_0$/blocks.27/self_attn/ConstantOfShape"ConstantOfShape*L value*@B0/blocks.27/self_attn/ConstantOfShape_attr::valueJ )/blocks.27/self_attn/Constant_41_output_0 /blocks.27/self_attn/Constant_41"Constant*F value*:B,/blocks.27/self_attn/Constant_41_attr::valueJ  -/blocks.27/self_attn/ConstantOfShape_output_0 )/blocks.27/self_attn/Constant_41_output_0#/blocks.27/self_attn/Mul_4_output_0/blocks.27/self_attn/Mul_4"Mul  '/blocks.27/self_attn/Reshape_3_output_0 #/blocks.27/self_attn/Mul_4_output_0#/blocks.27/self_attn/Equal_output_0/blocks.27/self_attn/Equal"Equal  #/blocks.27/self_attn/Equal_output_0 -/blocks.27/self_attn/ConstantOfShape_output_0 '/blocks.27/self_attn/Reshape_3_output_0#/blocks.27/self_attn/Where_output_0/blocks.27/self_attn/Where"Where  */blocks.27/self_attn/Unsqueeze_12_output_0 #/blocks.27/self_attn/Where_output_0$/blocks.27/self_attn/Expand_output_0/blocks.27/self_attn/Expand"Expand )/blocks.27/self_attn/Constant_42_output_0 /blocks.27/self_attn/Constant_42"Constant*F value*:B,/blocks.27/self_attn/Constant_42_attr::valueJ  &/blocks.27/self_attn/Gather_7_output_0 )/blocks.27/self_attn/Constant_42_output_0#/blocks.27/self_attn/Mul_5_output_0/blocks.27/self_attn/Mul_5"Mul fonnx::Unsqueeze_8388 Constant_9795"Constant*5 value*)BConstant_9795_attr::valueJ  &/blocks.27/self_attn/Gather_6_output_0 onnx::Unsqueeze_8388*/blocks.27/self_attn/Unsqueeze_17_output_0!/blocks.27/self_attn/Unsqueeze_17" Unsqueeze fonnx::Unsqueeze_8390 Constant_9797"Constant*5 value*)BConstant_9797_attr::valueJ  #/blocks.27/self_attn/Mul_5_output_0 onnx::Unsqueeze_8390*/blocks.27/self_attn/Unsqueeze_18_output_0!/blocks.27/self_attn/Unsqueeze_18" Unsqueeze fonnx::Unsqueeze_8392 Constant_9799"Constant*5 value*)BConstant_9799_attr::valueJ  &/blocks.27/self_attn/Gather_8_output_0 onnx::Unsqueeze_8392*/blocks.27/self_attn/Unsqueeze_19_output_0!/blocks.27/self_attn/Unsqueeze_19" Unsqueeze fonnx::Unsqueeze_8394 Constant_9801"Constant*5 value*)BConstant_9801_attr::valueJ  &/blocks.27/self_attn/Gather_9_output_0 onnx::Unsqueeze_8394*/blocks.27/self_attn/Unsqueeze_20_output_0!/blocks.27/self_attn/Unsqueeze_20" Unsqueeze  */blocks.27/self_attn/Unsqueeze_17_output_0 */blocks.27/self_attn/Unsqueeze_18_output_0 */blocks.27/self_attn/Unsqueeze_19_output_0 */blocks.27/self_attn/Unsqueeze_20_output_0&/blocks.27/self_attn/Concat_9_output_0/blocks.27/self_attn/Concat_9"Concat* axis  $/blocks.27/self_attn/Expand_output_0 &/blocks.27/self_attn/Concat_9_output_0'/blocks.27/self_attn/Reshape_4_output_0/blocks.27/self_attn/Reshape_4"Reshape* allowzero w )/blocks.27/self_attn/Transpose_2_output_0%/blocks.27/self_attn/Shape_9_output_0/blocks.27/self_attn/Shape_9"Shape )/blocks.27/self_attn/Constant_43_output_0 /blocks.27/self_attn/Constant_43"Constant*F value*:B,/blocks.27/self_attn/Constant_43_attr::valueJ  %/blocks.27/self_attn/Shape_9_output_0 )/blocks.27/self_attn/Constant_43_output_0'/blocks.27/self_attn/Gather_10_output_0/blocks.27/self_attn/Gather_10"Gather* axis y )/blocks.27/self_attn/Transpose_2_output_0&/blocks.27/self_attn/Shape_10_output_0/blocks.27/self_attn/Shape_10"Shape )/blocks.27/self_attn/Constant_44_output_0 /blocks.27/self_attn/Constant_44"Constant*F value*:B,/blocks.27/self_attn/Constant_44_attr::valueJ  &/blocks.27/self_attn/Shape_10_output_0 )/blocks.27/self_attn/Constant_44_output_0'/blocks.27/self_attn/Gather_11_output_0/blocks.27/self_attn/Gather_11"Gather* axis y )/blocks.27/self_attn/Transpose_2_output_0&/blocks.27/self_attn/Shape_11_output_0/blocks.27/self_attn/Shape_11"Shape )/blocks.27/self_attn/Constant_45_output_0 /blocks.27/self_attn/Constant_45"Constant*F value*:B,/blocks.27/self_attn/Constant_45_attr::valueJ  &/blocks.27/self_attn/Shape_11_output_0 )/blocks.27/self_attn/Constant_45_output_0'/blocks.27/self_attn/Gather_12_output_0/blocks.27/self_attn/Gather_12"Gather* axis y )/blocks.27/self_attn/Transpose_2_output_0&/blocks.27/self_attn/Shape_12_output_0/blocks.27/self_attn/Shape_12"Shape )/blocks.27/self_attn/Constant_46_output_0 /blocks.27/self_attn/Constant_46"Constant*F value*:B,/blocks.27/self_attn/Constant_46_attr::valueJ  &/blocks.27/self_attn/Shape_12_output_0 )/blocks.27/self_attn/Constant_46_output_0'/blocks.27/self_attn/Gather_13_output_0/blocks.27/self_attn/Gather_13"Gather* axis )/blocks.27/self_attn/Constant_47_output_0 /blocks.27/self_attn/Constant_47"Constant*H value*<B,/blocks.27/self_attn/Constant_47_attr::valueJ  )/blocks.27/self_attn/Transpose_2_output_0 )/blocks.27/self_attn/Constant_47_output_0*/blocks.27/self_attn/Unsqueeze_21_output_0!/blocks.27/self_attn/Unsqueeze_21" Unsqueeze )/blocks.27/self_attn/Constant_48_output_0 /blocks.27/self_attn/Constant_48"Constant*H value*<B,/blocks.27/self_attn/Constant_48_attr::valueJ  '/blocks.27/self_attn/Gather_10_output_0 )/blocks.27/self_attn/Constant_48_output_0*/blocks.27/self_attn/Unsqueeze_22_output_0!/blocks.27/self_attn/Unsqueeze_22" Unsqueeze )/blocks.27/self_attn/Constant_49_output_0 /blocks.27/self_attn/Constant_49"Constant*H value*<B,/blocks.27/self_attn/Constant_49_attr::valueJ  '/blocks.27/self_attn/Gather_11_output_0 )/blocks.27/self_attn/Constant_49_output_0*/blocks.27/self_attn/Unsqueeze_23_output_0!/blocks.27/self_attn/Unsqueeze_23" Unsqueeze )/blocks.27/self_attn/Constant_50_output_0 /blocks.27/self_attn/Constant_50"Constant*H value*<B,/blocks.27/self_attn/Constant_50_attr::valueJ )/blocks.27/self_attn/Constant_51_output_0 /blocks.27/self_attn/Constant_51"Constant*H value*<B,/blocks.27/self_attn/Constant_51_attr::valueJ  '/blocks.27/self_attn/Gather_12_output_0 )/blocks.27/self_attn/Constant_51_output_0*/blocks.27/self_attn/Unsqueeze_24_output_0!/blocks.27/self_attn/Unsqueeze_24" Unsqueeze )/blocks.27/self_attn/Constant_52_output_0 /blocks.27/self_attn/Constant_52"Constant*H value*<B,/blocks.27/self_attn/Constant_52_attr::valueJ  '/blocks.27/self_attn/Gather_13_output_0 )/blocks.27/self_attn/Constant_52_output_0*/blocks.27/self_attn/Unsqueeze_25_output_0!/blocks.27/self_attn/Unsqueeze_25" Unsqueeze  */blocks.27/self_attn/Unsqueeze_22_output_0 */blocks.27/self_attn/Unsqueeze_23_output_0 )/blocks.27/self_attn/Constant_50_output_0 */blocks.27/self_attn/Unsqueeze_24_output_0 */blocks.27/self_attn/Unsqueeze_25_output_0'/blocks.27/self_attn/Concat_10_output_0/blocks.27/self_attn/Concat_10"Concat* axis )/blocks.27/self_attn/Constant_53_output_0 /blocks.27/self_attn/Constant_53"Constant*H value*<B,/blocks.27/self_attn/Constant_53_attr::valueJ  '/blocks.27/self_attn/Concat_10_output_0 )/blocks.27/self_attn/Constant_53_output_0'/blocks.27/self_attn/Reshape_5_output_0/blocks.27/self_attn/Reshape_5"Reshape* allowzero w '/blocks.27/self_attn/Reshape_5_output_0&/blocks.27/self_attn/Shape_13_output_0/blocks.27/self_attn/Shape_13"Shape  &/blocks.27/self_attn/Shape_13_output_0//blocks.27/self_attn/ConstantOfShape_1_output_0&/blocks.27/self_attn/ConstantOfShape_1"ConstantOfShape*N value*BB2/blocks.27/self_attn/ConstantOfShape_1_attr::valueJ )/blocks.27/self_attn/Constant_54_output_0 /blocks.27/self_attn/Constant_54"Constant*F value*:B,/blocks.27/self_attn/Constant_54_attr::valueJ  //blocks.27/self_attn/ConstantOfShape_1_output_0 )/blocks.27/self_attn/Constant_54_output_0#/blocks.27/self_attn/Mul_6_output_0/blocks.27/self_attn/Mul_6"Mul  '/blocks.27/self_attn/Reshape_5_output_0 #/blocks.27/self_attn/Mul_6_output_0%/blocks.27/self_attn/Equal_1_output_0/blocks.27/self_attn/Equal_1"Equal  %/blocks.27/self_attn/Equal_1_output_0 //blocks.27/self_attn/ConstantOfShape_1_output_0 '/blocks.27/self_attn/Reshape_5_output_0%/blocks.27/self_attn/Where_1_output_0/blocks.27/self_attn/Where_1"Where  */blocks.27/self_attn/Unsqueeze_21_output_0 %/blocks.27/self_attn/Where_1_output_0&/blocks.27/self_attn/Expand_1_output_0/blocks.27/self_attn/Expand_1"Expand )/blocks.27/self_attn/Constant_55_output_0 /blocks.27/self_attn/Constant_55"Constant*F value*:B,/blocks.27/self_attn/Constant_55_attr::valueJ  '/blocks.27/self_attn/Gather_11_output_0 )/blocks.27/self_attn/Constant_55_output_0#/blocks.27/self_attn/Mul_7_output_0/blocks.27/self_attn/Mul_7"Mul fonnx::Unsqueeze_8434 Constant_9840"Constant*5 value*)BConstant_9840_attr::valueJ  '/blocks.27/self_attn/Gather_10_output_0 onnx::Unsqueeze_8434*/blocks.27/self_attn/Unsqueeze_26_output_0!/blocks.27/self_attn/Unsqueeze_26" Unsqueeze fonnx::Unsqueeze_8436 Constant_9842"Constant*5 value*)BConstant_9842_attr::valueJ  #/blocks.27/self_attn/Mul_7_output_0 onnx::Unsqueeze_8436*/blocks.27/self_attn/Unsqueeze_27_output_0!/blocks.27/self_attn/Unsqueeze_27" Unsqueeze fonnx::Unsqueeze_8438 Constant_9844"Constant*5 value*)BConstant_9844_attr::valueJ  '/blocks.27/self_attn/Gather_12_output_0 onnx::Unsqueeze_8438*/blocks.27/self_attn/Unsqueeze_28_output_0!/blocks.27/self_attn/Unsqueeze_28" Unsqueeze fonnx::Unsqueeze_8440 Constant_9846"Constant*5 value*)BConstant_9846_attr::valueJ  '/blocks.27/self_attn/Gather_13_output_0 onnx::Unsqueeze_8440*/blocks.27/self_attn/Unsqueeze_29_output_0!/blocks.27/self_attn/Unsqueeze_29" Unsqueeze  */blocks.27/self_attn/Unsqueeze_26_output_0 */blocks.27/self_attn/Unsqueeze_27_output_0 */blocks.27/self_attn/Unsqueeze_28_output_0 */blocks.27/self_attn/Unsqueeze_29_output_0'/blocks.27/self_attn/Concat_11_output_0/blocks.27/self_attn/Concat_11"Concat* axis  &/blocks.27/self_attn/Expand_1_output_0 '/blocks.27/self_attn/Concat_11_output_0'/blocks.27/self_attn/Reshape_6_output_0/blocks.27/self_attn/Reshape_6"Reshape* allowzero  '/blocks.27/self_attn/Transpose_output_0 '/blocks.27/self_attn/Reshape_4_output_0$/blocks.27/self_attn/MatMul_output_0/blocks.27/self_attn/MatMul"MatMul )/blocks.27/self_attn/Constant_56_output_0 /blocks.27/self_attn/Constant_56"Constant*B value*6B,/blocks.27/self_attn/Constant_56_attr::valueJ5A  $/blocks.27/self_attn/MatMul_output_0 )/blocks.27/self_attn/Constant_56_output_0#/blocks.27/self_attn/Div_2_output_0/blocks.27/self_attn/Div_2"Div { #/blocks.27/self_attn/Div_2_output_0 attention_mask#/blocks.27/self_attn/Add_2_output_0/blocks.27/self_attn/Add_2"Add  #/blocks.27/self_attn/Add_2_output_0%/blocks.27/self_attn/Softmax_output_0/blocks.27/self_attn/Softmax"Softmax* axis { %/blocks.27/self_attn/Softmax_output_0$/blocks.27/self_attn/Cast_4_output_0/blocks.27/self_attn/Cast_4"Cast* to  $/blocks.27/self_attn/Cast_4_output_0 '/blocks.27/self_attn/Reshape_6_output_0&/blocks.27/self_attn/MatMul_1_output_0/blocks.27/self_attn/MatMul_1"MatMul  &/blocks.27/self_attn/MatMul_1_output_0)/blocks.27/self_attn/Transpose_3_output_0 /blocks.27/self_attn/Transpose_3" Transpose* perm@@@@ fonnx::Unsqueeze_8452 Constant_9858"Constant*5 value*)BConstant_9858_attr::valueJ  $/blocks.27/self_attn/Gather_output_0 onnx::Unsqueeze_8452*/blocks.27/self_attn/Unsqueeze_30_output_0!/blocks.27/self_attn/Unsqueeze_30" Unsqueeze fonnx::Unsqueeze_8454 Constant_9860"Constant*5 value*)BConstant_9860_attr::valueJ  &/blocks.27/self_attn/Gather_1_output_0 onnx::Unsqueeze_8454*/blocks.27/self_attn/Unsqueeze_31_output_0!/blocks.27/self_attn/Unsqueeze_31" Unsqueeze )/blocks.27/self_attn/Constant_57_output_0 /blocks.27/self_attn/Constant_57"Constant*H value*<B,/blocks.27/self_attn/Constant_57_attr::valueJ  */blocks.27/self_attn/Unsqueeze_30_output_0 */blocks.27/self_attn/Unsqueeze_31_output_0 )/blocks.27/self_attn/Constant_57_output_0'/blocks.27/self_attn/Concat_12_output_0/blocks.27/self_attn/Concat_12"Concat* axis  )/blocks.27/self_attn/Transpose_3_output_0 '/blocks.27/self_attn/Concat_12_output_0'/blocks.27/self_attn/Reshape_7_output_0/blocks.27/self_attn/Reshape_7"Reshape* allowzero  '/blocks.27/self_attn/Reshape_7_output_0 onnx::MatMul_9345+/blocks.27/self_attn/o_proj/MatMul_output_0"/blocks.27/self_attn/o_proj/MatMul"MatMul  */blocks.27/input_layernorm/Cast_1_output_0 +/blocks.27/self_attn/o_proj/MatMul_output_0/blocks.27/Add_output_0/blocks.27/Add"Add  /blocks.27/Add_output_01/blocks.27/post_attention_layernorm/Cast_output_0(/blocks.27/post_attention_layernorm/Cast"Cast* to 5/blocks.27/post_attention_layernorm/Constant_output_0,/blocks.27/post_attention_layernorm/Constant"Constant*N value*BB8/blocks.27/post_attention_layernorm/Constant_attr::valueJ@  1/blocks.27/post_attention_layernorm/Cast_output_0 5/blocks.27/post_attention_layernorm/Constant_output_00/blocks.27/post_attention_layernorm/Pow_output_0'/blocks.27/post_attention_layernorm/Pow"Pow  0/blocks.27/post_attention_layernorm/Pow_output_07/blocks.27/post_attention_layernorm/ReduceMean_output_0./blocks.27/post_attention_layernorm/ReduceMean" ReduceMean* axes@* keepdims 7/blocks.27/post_attention_layernorm/Constant_1_output_0./blocks.27/post_attention_layernorm/Constant_1"Constant*P value*DB:/blocks.27/post_attention_layernorm/Constant_1_attr::valueJ75  7/blocks.27/post_attention_layernorm/ReduceMean_output_0 7/blocks.27/post_attention_layernorm/Constant_1_output_00/blocks.27/post_attention_layernorm/Add_output_0'/blocks.27/post_attention_layernorm/Add"Add  0/blocks.27/post_attention_layernorm/Add_output_01/blocks.27/post_attention_layernorm/Sqrt_output_0(/blocks.27/post_attention_layernorm/Sqrt"Sqrt 7/blocks.27/post_attention_layernorm/Constant_2_output_0./blocks.27/post_attention_layernorm/Constant_2"Constant*P value*DB:/blocks.27/post_attention_layernorm/Constant_2_attr::valueJ?  7/blocks.27/post_attention_layernorm/Constant_2_output_0 1/blocks.27/post_attention_layernorm/Sqrt_output_00/blocks.27/post_attention_layernorm/Div_output_0'/blocks.27/post_attention_layernorm/Div"Div  1/blocks.27/post_attention_layernorm/Cast_output_03/blocks.27/post_attention_layernorm/Cast_1_output_0*/blocks.27/post_attention_layernorm/Cast_1"Cast* to  3/blocks.27/post_attention_layernorm/Cast_1_output_0 0/blocks.27/post_attention_layernorm/Div_output_00/blocks.27/post_attention_layernorm/Mul_output_0'/blocks.27/post_attention_layernorm/Mul"Mul  0/blocks.27/post_attention_layernorm/Mul_output_0 )blocks.27.post_attention_layernorm.weight2/blocks.27/post_attention_layernorm/Mul_1_output_0)/blocks.27/post_attention_layernorm/Mul_1"Mul  2/blocks.27/post_attention_layernorm/Mul_1_output_03/blocks.27/post_attention_layernorm/Cast_2_output_0*/blocks.27/post_attention_layernorm/Cast_2"Cast* to  3/blocks.27/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_9346(/blocks.27/mlp/gate_proj/MatMul_output_0/blocks.27/mlp/gate_proj/MatMul"MatMul z (/blocks.27/mlp/gate_proj/MatMul_output_0&/blocks.27/mlp/act_fn/Sigmoid_output_0/blocks.27/mlp/act_fn/Sigmoid"Sigmoid  (/blocks.27/mlp/gate_proj/MatMul_output_0 &/blocks.27/mlp/act_fn/Sigmoid_output_0"/blocks.27/mlp/act_fn/Mul_output_0/blocks.27/mlp/act_fn/Mul"Mul  3/blocks.27/post_attention_layernorm/Cast_2_output_0 onnx::MatMul_9347&/blocks.27/mlp/up_proj/MatMul_output_0/blocks.27/mlp/up_proj/MatMul"MatMul  "/blocks.27/mlp/act_fn/Mul_output_0 &/blocks.27/mlp/up_proj/MatMul_output_0/blocks.27/mlp/Mul_output_0/blocks.27/mlp/Mul"Mul  /blocks.27/mlp/Mul_output_0 onnx::MatMul_9348(/blocks.27/mlp/down_proj/MatMul_output_0/blocks.27/mlp/down_proj/MatMul"MatMul  3/blocks.27/post_attention_layernorm/Cast_1_output_0 (/blocks.27/mlp/down_proj/MatMul_output_0/blocks.27/Add_1_output_0/blocks.27/Add_1"Add e/Constant_20_output_0 /Constant_20"Constant*4 value*(B/Constant_20_attr::valueJ e/Constant_21_output_0 /Constant_21"Constant*4 value*(B/Constant_21_attr::valueJ e/Constant_22_output_0 /Constant_22"Constant*4 value*(B/Constant_22_attr::valueJ c /blocks.27/Add_1_output_0/final_layernorm/Cast_output_0/final_layernorm/Cast"Cast* to "/final_layernorm/Constant_output_0/final_layernorm/Constant"Constant*; value*/B%/final_layernorm/Constant_attr::valueJ@ ~ /final_layernorm/Cast_output_0 "/final_layernorm/Constant_output_0/final_layernorm/Pow_output_0/final_layernorm/Pow"Pow  /final_layernorm/Pow_output_0$/final_layernorm/ReduceMean_output_0/final_layernorm/ReduceMean" ReduceMean* axes@* keepdims $/final_layernorm/Constant_1_output_0/final_layernorm/Constant_1"Constant*= value*1B'/final_layernorm/Constant_1_attr::valueJ75  $/final_layernorm/ReduceMean_output_0 $/final_layernorm/Constant_1_output_0/final_layernorm/Add_output_0/final_layernorm/Add"Add \ /final_layernorm/Add_output_0/final_layernorm/Sqrt_output_0/final_layernorm/Sqrt"Sqrt $/final_layernorm/Constant_2_output_0/final_layernorm/Constant_2"Constant*= value*1B'/final_layernorm/Constant_2_attr::valueJ?  $/final_layernorm/Constant_2_output_0 /final_layernorm/Sqrt_output_0/final_layernorm/Div_output_0/final_layernorm/Div"Div y /final_layernorm/Cast_output_0 /final_layernorm/Div_output_0/final_layernorm/Mul_output_0/final_layernorm/Mul"Mul k /final_layernorm/Mul_output_0 /final_layernorm/Cast_1_output_0/final_layernorm/Cast_1"Cast* to f final_layernorm.weight /final_layernorm/Cast_1_output_0 hidden_states/final_layernorm/Mul_1"Mul A hidden_states onnx::MatMul_9352logits /lm/lm/MatMul"MatMul e/Constant_23_output_0 /Constant_23"Constant*4 value*(B/Constant_23_attr::valueJ j %/blocks.0/self_attn/Concat_7_output_0 /Constant_23_output_0/Unsqueeze_output_0 /Unsqueeze" Unsqueeze e/Constant_24_output_0 /Constant_24"Constant*4 value*(B/Constant_24_attr::valueJ n %/blocks.1/self_attn/Concat_7_output_0 /Constant_24_output_0/Unsqueeze_1_output_0 /Unsqueeze_1" Unsqueeze e/Constant_25_output_0 /Constant_25"Constant*4 value*(B/Constant_25_attr::valueJ n %/blocks.2/self_attn/Concat_7_output_0 /Constant_25_output_0/Unsqueeze_2_output_0 /Unsqueeze_2" Unsqueeze e/Constant_26_output_0 /Constant_26"Constant*4 value*(B/Constant_26_attr::valueJ n %/blocks.3/self_attn/Concat_7_output_0 /Constant_26_output_0/Unsqueeze_3_output_0 /Unsqueeze_3" Unsqueeze e/Constant_27_output_0 /Constant_27"Constant*4 value*(B/Constant_27_attr::valueJ n %/blocks.4/self_attn/Concat_7_output_0 /Constant_27_output_0/Unsqueeze_4_output_0 /Unsqueeze_4" Unsqueeze e/Constant_28_output_0 /Constant_28"Constant*4 value*(B/Constant_28_attr::valueJ n %/blocks.5/self_attn/Concat_7_output_0 /Constant_28_output_0/Unsqueeze_5_output_0 /Unsqueeze_5" Unsqueeze e/Constant_29_output_0 /Constant_29"Constant*4 value*(B/Constant_29_attr::valueJ n %/blocks.6/self_attn/Concat_7_output_0 /Constant_29_output_0/Unsqueeze_6_output_0 /Unsqueeze_6" Unsqueeze e/Constant_30_output_0 /Constant_30"Constant*4 value*(B/Constant_30_attr::valueJ n %/blocks.7/self_attn/Concat_7_output_0 /Constant_30_output_0/Unsqueeze_7_output_0 /Unsqueeze_7" Unsqueeze e/Constant_31_output_0 /Constant_31"Constant*4 value*(B/Constant_31_attr::valueJ n %/blocks.8/self_attn/Concat_7_output_0 /Constant_31_output_0/Unsqueeze_8_output_0 /Unsqueeze_8" Unsqueeze e/Constant_32_output_0 /Constant_32"Constant*4 value*(B/Constant_32_attr::valueJ n %/blocks.9/self_attn/Concat_7_output_0 /Constant_32_output_0/Unsqueeze_9_output_0 /Unsqueeze_9" Unsqueeze e/Constant_33_output_0 /Constant_33"Constant*4 value*(B/Constant_33_attr::valueJ q &/blocks.10/self_attn/Concat_7_output_0 /Constant_33_output_0/Unsqueeze_10_output_0 /Unsqueeze_10" Unsqueeze e/Constant_34_output_0 /Constant_34"Constant*4 value*(B/Constant_34_attr::valueJ q &/blocks.11/self_attn/Concat_7_output_0 /Constant_34_output_0/Unsqueeze_11_output_0 /Unsqueeze_11" Unsqueeze e/Constant_35_output_0 /Constant_35"Constant*4 value*(B/Constant_35_attr::valueJ q &/blocks.12/self_attn/Concat_7_output_0 /Constant_35_output_0/Unsqueeze_12_output_0 /Unsqueeze_12" Unsqueeze e/Constant_36_output_0 /Constant_36"Constant*4 value*(B/Constant_36_attr::valueJ q &/blocks.13/self_attn/Concat_7_output_0 /Constant_36_output_0/Unsqueeze_13_output_0 /Unsqueeze_13" Unsqueeze e/Constant_37_output_0 /Constant_37"Constant*4 value*(B/Constant_37_attr::valueJ q &/blocks.14/self_attn/Concat_7_output_0 /Constant_37_output_0/Unsqueeze_14_output_0 /Unsqueeze_14" Unsqueeze e/Constant_38_output_0 /Constant_38"Constant*4 value*(B/Constant_38_attr::valueJ q &/blocks.15/self_attn/Concat_7_output_0 /Constant_38_output_0/Unsqueeze_15_output_0 /Unsqueeze_15" Unsqueeze e/Constant_39_output_0 /Constant_39"Constant*4 value*(B/Constant_39_attr::valueJ q &/blocks.16/self_attn/Concat_7_output_0 /Constant_39_output_0/Unsqueeze_16_output_0 /Unsqueeze_16" Unsqueeze e/Constant_40_output_0 /Constant_40"Constant*4 value*(B/Constant_40_attr::valueJ q &/blocks.17/self_attn/Concat_7_output_0 /Constant_40_output_0/Unsqueeze_17_output_0 /Unsqueeze_17" Unsqueeze e/Constant_41_output_0 /Constant_41"Constant*4 value*(B/Constant_41_attr::valueJ q &/blocks.18/self_attn/Concat_7_output_0 /Constant_41_output_0/Unsqueeze_18_output_0 /Unsqueeze_18" Unsqueeze e/Constant_42_output_0 /Constant_42"Constant*4 value*(B/Constant_42_attr::valueJ q &/blocks.19/self_attn/Concat_7_output_0 /Constant_42_output_0/Unsqueeze_19_output_0 /Unsqueeze_19" Unsqueeze e/Constant_43_output_0 /Constant_43"Constant*4 value*(B/Constant_43_attr::valueJ q &/blocks.20/self_attn/Concat_7_output_0 /Constant_43_output_0/Unsqueeze_20_output_0 /Unsqueeze_20" Unsqueeze e/Constant_44_output_0 /Constant_44"Constant*4 value*(B/Constant_44_attr::valueJ q &/blocks.21/self_attn/Concat_7_output_0 /Constant_44_output_0/Unsqueeze_21_output_0 /Unsqueeze_21" Unsqueeze e/Constant_45_output_0 /Constant_45"Constant*4 value*(B/Constant_45_attr::valueJ q &/blocks.22/self_attn/Concat_7_output_0 /Constant_45_output_0/Unsqueeze_22_output_0 /Unsqueeze_22" Unsqueeze e/Constant_46_output_0 /Constant_46"Constant*4 value*(B/Constant_46_attr::valueJ q &/blocks.23/self_attn/Concat_7_output_0 /Constant_46_output_0/Unsqueeze_23_output_0 /Unsqueeze_23" Unsqueeze e/Constant_47_output_0 /Constant_47"Constant*4 value*(B/Constant_47_attr::valueJ q &/blocks.24/self_attn/Concat_7_output_0 /Constant_47_output_0/Unsqueeze_24_output_0 /Unsqueeze_24" Unsqueeze e/Constant_48_output_0 /Constant_48"Constant*4 value*(B/Constant_48_attr::valueJ q &/blocks.25/self_attn/Concat_7_output_0 /Constant_48_output_0/Unsqueeze_25_output_0 /Unsqueeze_25" Unsqueeze e/Constant_49_output_0 /Constant_49"Constant*4 value*(B/Constant_49_attr::valueJ q &/blocks.26/self_attn/Concat_7_output_0 /Constant_49_output_0/Unsqueeze_26_output_0 /Unsqueeze_26" Unsqueeze e/Constant_50_output_0 /Constant_50"Constant*4 value*(B/Constant_50_attr::valueJ q &/blocks.27/self_attn/Concat_7_output_0 /Constant_50_output_0/Unsqueeze_27_output_0 /Unsqueeze_27" Unsqueeze  /Unsqueeze_output_0 /Unsqueeze_1_output_0 /Unsqueeze_2_output_0 /Unsqueeze_3_output_0 /Unsqueeze_4_output_0 /Unsqueeze_5_output_0 /Unsqueeze_6_output_0 /Unsqueeze_7_output_0 /Unsqueeze_8_output_0 /Unsqueeze_9_output_0 /Unsqueeze_10_output_0 /Unsqueeze_11_output_0 /Unsqueeze_12_output_0 /Unsqueeze_13_output_0 /Unsqueeze_14_output_0 /Unsqueeze_15_output_0 /Unsqueeze_16_output_0 /Unsqueeze_17_output_0 /Unsqueeze_18_output_0 /Unsqueeze_19_output_0 /Unsqueeze_20_output_0 /Unsqueeze_21_output_0 /Unsqueeze_22_output_0 /Unsqueeze_23_output_0 /Unsqueeze_24_output_0 /Unsqueeze_25_output_0 /Unsqueeze_26_output_0 /Unsqueeze_27_output_0presents/Concat"Concat* axis main_graph*lBblocks.0.input_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset0j length4096p*xB(blocks.0.post_attention_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset4096j length4096p*B blocks.0.self_attn.k_norm.weightJ?@@@?"@@@?@@=@@@ @@@@??@#@@?@@!@ @7@@-@#>@&@.@b@@X@@ @@y@@ @?<@??@B?@??@?6@@?'@??%@{?%@n@??V@o@?? @$@@?;?@@@@ @?? @#@@A@@?@8@@,@8@@d@4@6@@@ @8@ @@8@ @/@?6@@??B??@3@"@G@@ @0@@&@3@@*B blocks.0.self_attn.q_norm.weightJ@?<?&@???1@@?????@ @ @? @@?@?)@??^@?>>H@????@ @?@??@*oBblocks.1.input_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset8192j length4096p*yB(blocks.1.post_attention_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset12288j length4096p*B blocks.1.self_attn.k_norm.weightJ@p?@?@}>U????????@?1@??=@5@??:@G@@@P@@U@<?8@u@ @@I@?@@@/@?? @??&??2B2@?@@?7@ @@???@1?@???@?u?W?&@??H???@? @@??@r@@,@*@7@?W@=7@R@?w&@L@@@?@???/@@??@??@?w??'@?@@P@?7@@ @*B blocks.1.self_attn.q_norm.weightJ>P@K????N@ ]@@@X@??=???@?????w???h??N????U???@\?4@??????????@?X>?(@>??x???@?@W?@W???@B@t@? @?J@?????????M??????m?T@M?a???z?h??K??>@?????????4?5?? @??? @?@???*pBblocks.2.input_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset16384j length4096p*yB(blocks.2.post_attention_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset20480j length4096p*B blocks.2.self_attn.k_norm.weightJ?@@*@@@@<s@??@@h@,@??[?@>?@???H???@??? @@??@???????????????@???@? @@?@???I@@@A<z@?G@@Y;-@@.@=->3??????k??u@??@???@(@?????@??@@??Q@?????0B?? @@?@?????*B blocks.2.self_attn.q_norm.weightJ??>-?>?=??!?@=0?3???@G@?@???@????!????????"???!@??@????@?????g???????@!@???4@R?Z<A?>?<?a?? @??:??7@]@@????&@?l????????????????????????@??=??????? @???*pBblocks.3.input_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset24576j length4096p*yB(blocks.3.post_attention_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset28672j length4096p*B blocks.3.self_attn.k_norm.weightJ?~???9@x?????>?@??v>???'@????:??? @?&;?y???@?3@??@?@@?@@?r=??@?@@ @"@?&@5@@@??:H?j?>??'?m>N?@?? @????????(@??????@?@???????@n@??@?{?D@A????? @@@ @@@@8@*B blocks.3.self_attn.q_norm.weightJ@?i@@{@?@?@@?@?>? @#@????????@?@@??=?O@???N>????????#@?[?@@;@???????@??@+@@?@@_@?7@?5@?@@@??@??????@??<>???@???i>???n@?@??-?o??@?@@g? @? @??????????*pBblocks.4.input_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset32768j length4096p*yB(blocks.4.post_attention_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset36864j length4096p*B blocks.4.self_attn.k_norm.weightJ??@9?-@?8@c?$@?@?@?d@:@@?W@@?@@l@@@>p@A@@@w:@^@u@@@r@5@H@A@8@v@d@@7@?????? A??)@>@???+@J?@???>@?@?@@9@@??@@?@*@@@o??A@@A@@@r@E@@R@I@@?@^@@@Y=3@g@@=@V@@'B?????(?????@1@)@?*B blocks.4.self_attn.q_norm.weightJ??x???:??Y??z???????5@?>?+???>=?>>?$?>>K?@?A?#??>3?|?q?<5??K?c??q?}??????&>???g??@?????????{???@?R?r???>m???t?@?>>G>?>?Q?=/?C????E????l?F???d? ?;?????@???????.@*pBblocks.5.input_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset40960j length4096p*yB(blocks.5.post_attention_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset45056j length4096p*B blocks.5.self_attn.k_norm.weightJ??? @a?????+???@???B@>@W@@ @:@@A@@a@@??@??@>@U@@?@?#<@?_@ @??@?A@ @*@@??x??^@?????P@j?9@@?????>>????>? @?\>?b@?@@@@H@@@@?~@ @?9 @ @?@?A@? @@?? @?>@@A???B@??@@@?@*B blocks.5.self_attn.q_norm.weightJn@???6@???@@????@?g?n?L???s??b??J?@?@j????n?=?? ??@??K??????==??S?;??? @?P??????Y?d@^?|??K@???@@?@??@???@?D?? ??'??K>????.???@??i??N=??????????? >???(? @??)????*pBblocks.6.input_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset49152j length4096p*yB(blocks.6.post_attention_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset53248j length4096p*B blocks.6.self_attn.k_norm.weightJ??>??@?@f@??)9@?>@???@@@"@#@?i@?@?@? @ @@@@$@@@?6@????????Y@?@@:@l@,@C@9@Y@@@C@A>==Q:R@f@@@n@A?@]??]@?@>?!?G?o@|??@?@!@ ?@?@??@?;@?@??@?@@??+@?@AF@ @i@@/@C@8@Y@@@E@A*B blocks.6.self_attn.q_norm.weightJ?@? @@?`???R?@?_@?x?"@)?f@?@??_???@y??y????????Y?????? @?? @?@@d@?? @??????????.??@G?@E= ?R?"?;K?@?g@?^?@"?@?@?????<@??????????@?????????@+@?&@@>?@?@?????@??*pBblocks.7.input_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset57344j length4096p*yB(blocks.7.post_attention_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset61440j length4096p*B blocks.7.self_attn.k_norm.weightJZ?@??>1??}?i?????@?:?F?T?#?l@x?R????:?@h?@??? A???f>??>???y??@N@>E@g@?E@ @`@ @@?@@>??7????9?@9@?????p@??@? @>??A@???@??@@~????<???A??@$??9@?@I?Z?A??j@??@??@@#@*B blocks.7.self_attn.q_norm.weightJ|@j??=@?A@@_@??p???'@k????@ @v?>#<?@???@?? @????>?? @???@???@?>S?E@E?1??W??J???1@??@]??E@?? @@??C?7@?@??D??????@??[????A>??^?@??? @???>??>n@?^???@9@<??0?????????*pBblocks.8.input_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset65536j length4096p*yB(blocks.8.post_attention_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset69632j length4096p*B blocks.8.self_attn.k_norm.weightJy;ػ??;?S:y????:?? @?@??@3@@???????????????????@E@??%@???A?4@??? @?@@ @ @W@?> ~<???:?;?$@?@\@????@???????@????@???4@????????@ @?????7@????? @ @?'@{@*B blocks.8.self_attn.q_norm.weightJ?"??=?=???D?d??}??4???@???s???????????????????????????@????????@???@??E>?.????g=?h??o??-???@??????????????P??????????????????@??????@??@??*pBblocks.9.input_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset73728j length4096p*yB(blocks.9.post_attention_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset77824j length4096p*B blocks.9.self_attn.k_norm.weightJ>[??L?>>9>??S?,@?W?K@c@@?@???><@?@??:?????$A??2@???A?1@ @?NA???@@???k?-@ @??@?@??+?U? o@> ? @R:>ҹ?0@?@?B@l?S@@?@'@? @?@?@???$<@?????=?@?@??=@????XA@??@*@?H@?@>@*B blocks.9.self_attn.q_norm.weightJ'@??>@@@??I@????;?>?????@5???????????>??????>????>@?+@???y@@I@??? @?@?6@,@/@?@@y?\?s@? T@V?L<??j? ?? ??Y??>!?????+??????p???@???????????? @@?>?@???&@????*qB blocks.10.input_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset81920j length4096p*zB)blocks.10.post_attention_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset86016j length4096p*B!blocks.10.self_attn.k_norm.weightJd?+@X 9?O??2@??8?@?? @=@?n@??@??@x?'@.@P@+@???ǹ??@@?@?@? @>C????A.@?@>???? @?@?@@W@@?s?? ??='?@:?>??????_? @???@?>>???????V@?????>@???%?>???H???"A?? @??@??,@?'@*B!blocks.10.self_attn.q_norm.weightJ@-?@@?&@?8???A?????n??D???q????-@b?]?V?r????@??>??U=@??? A_@@??:b??}@?? @??@???O?6?@S??@?F@?d???@??????@????c???@???????=?????c@???@z@@ @?????>?@????@??@?*qB blocks.11.input_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset90112j length4096p*zB)blocks.11.post_attention_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset94208j length4096p*B!blocks.11.self_attn.k_norm.weightJ>??.=P>=@[@? p;,@L??:B@a@?d@>@E@? @?@??? @?@@ @ @ @@@)@@ @??h@@2@&@!@ @@@@@@X@-@@u@=@g@@@<?@???@<?R@@?-@@?@ @j>@.@? @??F???@???@???@C@@'@@ @ @]@??@@@-@ @@@@@@R@.@@q@=@@@*B!blocks.11.self_attn.q_norm.weightJ?>;?.=<??0?"@:@y????#?@??@??"@????@?@? @?@@@?@@@@?@?E@@?@???????? @?@@?@???>@?@ @?=H?==@????(????@??@??@?@???@@@+@@@@?@?????@@&@@@????? @ @?!@@?@@?*qB blocks.12.input_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset98304j length4096p*{B)blocks.12.post_attention_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset102400j length4096p*B!blocks.12.self_attn.k_norm.weightJ?$?;=;@9;?@|Q??????"@S??M???@? @??@???@ @@@@?>???%@?D@????A???}?????v@$@@?@@(??8< @?)?O?a?;=?E?;>@S;?/@???z:??@@Z?@??>@???@??<@??? @??@;@?? @???m?????@?@?)@@*B!blocks.12.self_attn.q_norm.weightJ+@@2@z?t?>+@@?$>G@@n?@@?.???@@????/@???@???????Y@??????????>??%@B@????????$@?=@=??<H@E@B=?t@8@=q?@@?0???@????^@???a@??????@??????@???????@>@??????????*rB blocks.13.input_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset106496j length4096p*{B)blocks.13.post_attention_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset110592j length4096p*B!blocks.13.self_attn.k_norm.weightJ?><?@4?>?@@??8;?A?@????=@??@x@???@?@@ @?D@?@@@??@@?-@ @????+@T?@ @@?@#@?$@C@> =?>@1>%?????f????? @<@@????@3@<@?@?@?#@@@??@@@?@??@?@????@H?@@@ @@@@@2@*B!blocks.13.self_attn.q_norm.weightJ@>@?=}@@@<?)???@v=?@???????@?X??????d??????????@@?????????@??@9@??@??@;@>?Tz@@@@?9???@??@?????????j??????????????????@d@?@??????@??@???@3@@*rB blocks.14.input_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset114688j length4096p*{B)blocks.14.post_attention_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset118784j length4096p*B!blocks.14.self_attn.k_norm.weightJ?,?>?#:?:@;X@p???@@???j?@??-@? @?? @????7@@?????@?@?PA@l?+@8@???? @@@@@@@&@(@???U???!??g>>??v@;/:?O@H@h@? @??C@?L@??@???H@??@@@???@ @??%@?@?G@@???@?@?@@@@<@&@*B!blocks.14.self_attn.q_norm.weightJ@@<??@?o>=@@?<?8@5@>Y?[?i?????????????????????@?@????>?v@?????????????@?@???c@D=@0@@@N??#?3@6@?d?i?`???????t????@??????????????????{@r???@??@?@?????,@*rB blocks.15.input_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset122880j length4096p*{B)blocks.15.post_attention_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset126976j length4096p*B!blocks.15.self_attn.k_norm.weightJA@@ƺ?9???? >?@,???T?M@@{?0@?????`@@ @?@?G@??@ @?@P>@g@Q@???? @???@?? @?????@@? @SA@@?6>???X?=?b@.:??7??,@??@@%@????@???@?????(A@?@>@#@U@@R@?A????@????@ @@?@*B!blocks.15.self_attn.q_norm.weightJ ;?F;#@?????? @?l????k?????????o????\?@???????????'@?@?????? @???@:@@.@??@?>U<>.@<?K?A=??? @?d?ȼ????????????????????????>? @???|?P?i?@f>@@?????@@?@?7@?*rB blocks.16.input_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset131072j length4096p*{B)blocks.16.post_attention_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset135168j length4096p*B!blocks.16.self_attn.k_norm.weightJ=:;?$<?`<>4m@P=?@ @@?+>e@0@@?@@???@.@@@??@%@?@l??@??@@@F@@? @@@@??0@?@*@6@m@%@@6@t??=G>h??e?y?#@-??@?@>?k@W@?@,@?b@@ @ @h@>@@*@+@@@?@ @ @@?@?!@,@??@6@AE@@@@@/@??@??$@5@l@.@@@*B!blocks.16.self_attn.q_norm.weightJ(@<V?>?;?<???*=B??n???@y???????????@?????@??@?@#@??@??@@???@@?f@???/@W@7@@@?\<>??????,?@A??o???@????????????????@??}????@#@@?/???@???@@@:@*@???@P@I@*rB blocks.17.input_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset139264j length4096p*{B)blocks.17.post_attention_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset143360j length4096p*B!blocks.17.self_attn.k_norm.weightJ??=?=>>+?v@v@;?@@@?<@???<@?@ @?@?@?"@?@e?@@?@??;@?@?@6@@@?@?@@@ @@7@>??@(@?@=Ľ?O?Q? @?@0??<*@@G@:@?@4? @?????u?@?@?@@l@?'@@@@@@?r@@?.@U@?@A@??J@?@@>??9@ @?@*B!blocks.17.self_attn.q_norm.weightJ(@<&=?f?=@ ?N?= @??V??????????@?????????????@?@?@????@? @??@???A>@<@@?3@?<?=?b@m<u??@"?S???*?>d????@?????@??????????????q????@??@?>???????@c@7@? @>@@*rB blocks.18.input_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset147456j length4096p*{B)blocks.18.post_attention_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset151552j length4096p*B!blocks.18.self_attn.k_norm.weightJh?<<??J?=>?<?YM@???<@1@?@?????@??1@@?@? @@?*???@@?*@#@*@E@"@]??@@@@@?%@@+@1@*@e@@*@??@'=<???:?I=?>?:?0@n?U?`???A@J@???@@@?&@@C@??G@@?*@;@@Y@ @?@<@?@R@@@@ @?@(@?%@1@2@X@ @7@?*B!blocks.18.self_attn.q_norm.weightJ??=R?<??;Q???<??@?????????@????O?@?????@@?????????0@??????'@??????@@#@??o????=??@??@????????@@?????????@?????????????????????@???? @D@!@*rB blocks.19.input_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset155648j length4096p*{B)blocks.19.post_attention_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset159744j length4096p*B!blocks.19.self_attn.k_norm.weightJ?x?>?"=(><??]?$?%;K@?J?@@?"@?s@@~?@@?@@?@@??-?@@?@R@@@@@ @A%@@?@@@@@@@?@? @<@H@? <???0@???$@???b@@? @??!@??@@2@@$@J@<@@? @/@{@&@? @?@?@?@@@t?@?@? @? @@@@?!@? @)@=@*B!blocks.19.self_attn.q_norm.weightJ?t?b<?4<?7<?>=+@?@ =?????????????$@??????@@??@???@?_??A???????????@?u@????<?@Y<@? @=*@*@??@?????@???????????@"@????@?@?? @??@@??????????@?t@??7@*rB blocks.20.input_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset163840j length4096p*{B)blocks.20.post_attention_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset167936j length4096p*B!blocks.20.self_attn.k_norm.weightJw? @=;o?J?/@f?]@?={???<@??P?}??@?@}???@?@?@? @???@@??@@@@;@ @]@A@? @@@ @@0@@;@ @@?@V@@?b?<?`?";;?W@??A;???l??@?;?)???@?N?@?@?@??0@>?@??*@ @@?@?@? @ @@@@ @?)@@-@@@@@@*B!blocks.20.self_attn.q_norm.weightJ@?<K=;:d?]?g??]?;???z?????????K@????? @????@???@@?????@???????????? @@??@==?!@=?@?>=<?\???;???@???? @?<@???????????@@?@ @??@@?@o?@??????????? @(@,@@@*rB blocks.21.input_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset172032j length4096p*{B)blocks.21.post_attention_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset176128j length4096p*B!blocks.21.self_attn.k_norm.weightJ?<=%<Z;??8? @t<l?????o???@C@@E>?@?@??@'@?@?????@????@? @0@?@????@?@?!@*@?.@C@2@4>q?=?9w?=Q??=^;?<?/@<?>'@ @&@@?0@ @?@???@?@@???1@@?@?@1@?*A???@?@?@*@?-@e@K@*B!blocks.21.self_attn.q_norm.weightJ? =><?????;?@?????@ @????????????_??@@???? @@???@?@?@?????? @??!@????2?=?92??<<???E @<??@?????|?????@?@?@?@9??@@ @????5@ @?????????@??%@??>@*rB blocks.22.input_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset180224j length4096p*{B)blocks.22.post_attention_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset184320j length4096p*B!blocks.22.self_attn.k_norm.weightJ?;c????@9??@?J;%?9?@??????@@??P??????@?????@?????S@??????@??@?@ @"@Z@@a?k<i; ;: ???[?o????@*???>???????6@?????>?????m>??@???9@???????@?? @@@@@@*B!blocks.22.self_attn.q_norm.weightJ?<W?@z???;????=?j@????????*????@@????I??@???(???@??Y???????^????????? @?<_;@F?,????;@???????@?????????????@?@???@????????????@?????????*rB blocks.23.input_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset188416j length4096p*{B)blocks.23.post_attention_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset192512j length4096p*B!blocks.23.self_attn.k_norm.weightJ??<??)=9?1=S?:<)@?@@@%????@@?@D? @?@q@???%@%@????@Y@@?@@?0@A@ @@@ @@G@@@@9@@K@@???r?"?ǹ;???.@@?@??>>?? @?Q@5@T????c@???3???@??@@???@>??=@N@@>?@@@@@F@@@@B@@c@@?*B!blocks.23.self_attn.q_norm.weightJ?'@?=@ @@<???@?w??????????????? @?t???????@????E???Q? @?>???????J?U???S??@2@?@<? @@@???@???@??????????????????@???????/@????L? @???????\?>???R???@*rB blocks.24.input_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset196608j length4096p*{B)blocks.24.post_attention_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset200704j length4096p*B!blocks.24.self_attn.k_norm.weightJ0@=<<ѻ@<?>;?8<&@b=?/?>?@@5@@S@???@??:@?@????7?@@?@B@@\@?@=@?&@<@!@@C@?%@ @@9@@@@@@>]<,=@@<@?@@:??<@?=?@? ?8@??O@w? @@>@4@ @?@?@#@??@@@@ @@@ @@1@ A1@$@$@ @E@?(@?@B@@@@@@*B!blocks.24.self_attn.q_norm.weightJ?H=*X=?<W??@??@@ @?5@@A@?>@??????????@???? @@????@?????????????????>?? ?K????Q<2<<u?u?? @??#@@@?@@/@?@@???????????????@??!??=?*rB blocks.25.input_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset204800j length4096p*{B)blocks.25.post_attention_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset208896j length4096p*B!blocks.25.self_attn.k_norm.weightJ"@?9?]<m;?:?$;q??@??g;? >;?;@?4@?@???2@??-@-@?@z??@?@@$@@ @??@@ @@@@@H@D@@@@@k@@9@'>?<???;?+;???@ú.@8=?@??c@=??R@?e @ @C???????F@?@@@@@)@O@ @@ @@ @@@@@@N@@@@@@@@*B!blocks.25.self_attn.q_norm.weightJz?????n;]<?: @@<=?@?Q@U@<<??:@??@???@???@????? @??@?????@@?????????2?@?C???6?)?q;??@@?? @><?@+@?<?=E@@?@^@v??@?}??P=???@??????????????y???????????,?1?y?Z?{?i?*rB blocks.26.input_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset212992j length4096p*{B)blocks.26.post_attention_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset217088j length4096p*B!blocks.26.self_attn.k_norm.weightJ???cڻպ???????_s?%A??}?b?(@F@ @@?@ @???:???????_@?????@???@@@`@Q@e@Z@O@S@V@Y@??6<???=:"?<?)<?`<?ӻ??4ۼ'@?I=??>=? @h@:?U??@U@????????????M????@@?k@o@Z@p@R@V@l@h@*B!blocks.26.self_attn.q_norm.weightJ@??;??@?}??<)@<?=d@==7@??=??=d????X?? @?? @????????????y???????V?r?S???????"@?? ;<@:<@d=?˼@=)@8@=<?:@? @r????;??@???????????????W@?????@L?????????`<????9@X???@???@[>?@&@??@U@??@{????????@???;@?? @?9@??@3@: @???*@????????H@???? @(@??@@@%@?*A@??@,@??@^@?*B!blocks.27.self_attn.q_norm.weightJH@0@@???@?????&??????????_???????@????????@????w?e@?????,@?@@????>^?L@@>:@&@@???@?????[??@???w?*????=????f=r?????????_?????????????@>?@@??@?>Y? @*hBfinal_layernorm.weightj% locationqwen3_0.6B_fp32.onnx.dataj offset229376j length4096p*iBonnx::MatMul_8565j% locationqwen3_0.6B_fp32.onnx.dataj offset233472j length8388608p*jBonnx::MatMul_8566j% locationqwen3_0.6B_fp32.onnx.dataj offset8622080j length4194304p*kBonnx::MatMul_8567j% locationqwen3_0.6B_fp32.onnx.dataj offset12816384j length4194304p*kBonnx::MatMul_8589j% locationqwen3_0.6B_fp32.onnx.dataj offset17010688j length8388608p*lBonnx::MatMul_8590j% locationqwen3_0.6B_fp32.onnx.dataj offset25399296j length12582912p*lBonnx::MatMul_8591j% locationqwen3_0.6B_fp32.onnx.dataj offset37982208j length12582912p*lBonnx::MatMul_8592j% locationqwen3_0.6B_fp32.onnx.dataj offset50565120j length12582912p*kBonnx::MatMul_8593j% locationqwen3_0.6B_fp32.onnx.dataj offset63148032j length8388608p*kBonnx::MatMul_8594j% locationqwen3_0.6B_fp32.onnx.dataj offset71536640j length4194304p*kBonnx::MatMul_8595j% locationqwen3_0.6B_fp32.onnx.dataj offset75730944j length4194304p*kBonnx::MatMul_8617j% locationqwen3_0.6B_fp32.onnx.dataj offset79925248j length8388608p*lBonnx::MatMul_8618j% locationqwen3_0.6B_fp32.onnx.dataj offset88313856j length12582912p*mBonnx::MatMul_8619j% locationqwen3_0.6B_fp32.onnx.dataj offset 100896768j length12582912p*mBonnx::MatMul_8620j% locationqwen3_0.6B_fp32.onnx.dataj offset 113479680j length12582912p*lBonnx::MatMul_8621j% locationqwen3_0.6B_fp32.onnx.dataj offset 126062592j length8388608p*lBonnx::MatMul_8622j% locationqwen3_0.6B_fp32.onnx.dataj offset 134451200j length4194304p*lBonnx::MatMul_8623j% locationqwen3_0.6B_fp32.onnx.dataj offset 138645504j length4194304p*lBonnx::MatMul_8645j% locationqwen3_0.6B_fp32.onnx.dataj offset 142839808j length8388608p*mBonnx::MatMul_8646j% locationqwen3_0.6B_fp32.onnx.dataj offset 151228416j length12582912p*mBonnx::MatMul_8647j% locationqwen3_0.6B_fp32.onnx.dataj offset 163811328j length12582912p*mBonnx::MatMul_8648j% locationqwen3_0.6B_fp32.onnx.dataj offset 176394240j length12582912p*lBonnx::MatMul_8649j% locationqwen3_0.6B_fp32.onnx.dataj offset 188977152j length8388608p*lBonnx::MatMul_8650j% locationqwen3_0.6B_fp32.onnx.dataj offset 197365760j length4194304p*lBonnx::MatMul_8651j% locationqwen3_0.6B_fp32.onnx.dataj offset 201560064j length4194304p*lBonnx::MatMul_8673j% locationqwen3_0.6B_fp32.onnx.dataj offset 205754368j length8388608p*mBonnx::MatMul_8674j% locationqwen3_0.6B_fp32.onnx.dataj offset 214142976j length12582912p*mBonnx::MatMul_8675j% locationqwen3_0.6B_fp32.onnx.dataj offset 226725888j length12582912p*mBonnx::MatMul_8676j% locationqwen3_0.6B_fp32.onnx.dataj offset 239308800j length12582912p*lBonnx::MatMul_8677j% locationqwen3_0.6B_fp32.onnx.dataj offset 251891712j length8388608p*lBonnx::MatMul_8678j% locationqwen3_0.6B_fp32.onnx.dataj offset 260280320j length4194304p*lBonnx::MatMul_8679j% locationqwen3_0.6B_fp32.onnx.dataj offset 264474624j length4194304p*lBonnx::MatMul_8701j% locationqwen3_0.6B_fp32.onnx.dataj offset 268668928j length8388608p*mBonnx::MatMul_8702j% locationqwen3_0.6B_fp32.onnx.dataj offset 277057536j length12582912p*mBonnx::MatMul_8703j% locationqwen3_0.6B_fp32.onnx.dataj offset 289640448j length12582912p*mBonnx::MatMul_8704j% locationqwen3_0.6B_fp32.onnx.dataj offset 302223360j length12582912p*lBonnx::MatMul_8705j% locationqwen3_0.6B_fp32.onnx.dataj offset 314806272j length8388608p*lBonnx::MatMul_8706j% locationqwen3_0.6B_fp32.onnx.dataj offset 323194880j length4194304p*lBonnx::MatMul_8707j% locationqwen3_0.6B_fp32.onnx.dataj offset 327389184j length4194304p*lBonnx::MatMul_8729j% locationqwen3_0.6B_fp32.onnx.dataj offset 331583488j length8388608p*mBonnx::MatMul_8730j% locationqwen3_0.6B_fp32.onnx.dataj offset 339972096j length12582912p*mBonnx::MatMul_8731j% locationqwen3_0.6B_fp32.onnx.dataj offset 352555008j length12582912p*mBonnx::MatMul_8732j% locationqwen3_0.6B_fp32.onnx.dataj offset 365137920j length12582912p*lBonnx::MatMul_8733j% locationqwen3_0.6B_fp32.onnx.dataj offset 377720832j length8388608p*lBonnx::MatMul_8734j% locationqwen3_0.6B_fp32.onnx.dataj offset 386109440j length4194304p*lBonnx::MatMul_8735j% locationqwen3_0.6B_fp32.onnx.dataj offset 390303744j length4194304p*lBonnx::MatMul_8757j% locationqwen3_0.6B_fp32.onnx.dataj offset 394498048j length8388608p*mBonnx::MatMul_8758j% locationqwen3_0.6B_fp32.onnx.dataj offset 402886656j length12582912p*mBonnx::MatMul_8759j% locationqwen3_0.6B_fp32.onnx.dataj offset 415469568j length12582912p*mBonnx::MatMul_8760j% locationqwen3_0.6B_fp32.onnx.dataj offset 428052480j length12582912p*lBonnx::MatMul_8761j% locationqwen3_0.6B_fp32.onnx.dataj offset 440635392j length8388608p*lBonnx::MatMul_8762j% locationqwen3_0.6B_fp32.onnx.dataj offset 449024000j length4194304p*lBonnx::MatMul_8763j% locationqwen3_0.6B_fp32.onnx.dataj offset 453218304j length4194304p*lBonnx::MatMul_8785j% locationqwen3_0.6B_fp32.onnx.dataj offset 457412608j length8388608p*mBonnx::MatMul_8786j% locationqwen3_0.6B_fp32.onnx.dataj offset 465801216j length12582912p*mBonnx::MatMul_8787j% locationqwen3_0.6B_fp32.onnx.dataj offset 478384128j length12582912p*mBonnx::MatMul_8788j% locationqwen3_0.6B_fp32.onnx.dataj offset 490967040j length12582912p*lBonnx::MatMul_8789j% locationqwen3_0.6B_fp32.onnx.dataj offset 503549952j length8388608p*lBonnx::MatMul_8790j% locationqwen3_0.6B_fp32.onnx.dataj offset 511938560j length4194304p*lBonnx::MatMul_8791j% locationqwen3_0.6B_fp32.onnx.dataj offset 516132864j length4194304p*lBonnx::MatMul_8813j% locationqwen3_0.6B_fp32.onnx.dataj offset 520327168j length8388608p*mBonnx::MatMul_8814j% locationqwen3_0.6B_fp32.onnx.dataj offset 528715776j length12582912p*mBonnx::MatMul_8815j% locationqwen3_0.6B_fp32.onnx.dataj offset 541298688j length12582912p*mBonnx::MatMul_8816j% locationqwen3_0.6B_fp32.onnx.dataj offset 553881600j length12582912p*lBonnx::MatMul_8817j% locationqwen3_0.6B_fp32.onnx.dataj offset 566464512j length8388608p*lBonnx::MatMul_8818j% locationqwen3_0.6B_fp32.onnx.dataj offset 574853120j length4194304p*lBonnx::MatMul_8819j% locationqwen3_0.6B_fp32.onnx.dataj offset 579047424j length4194304p*lBonnx::MatMul_8841j% locationqwen3_0.6B_fp32.onnx.dataj offset 583241728j length8388608p*mBonnx::MatMul_8842j% locationqwen3_0.6B_fp32.onnx.dataj offset 591630336j length12582912p*mBonnx::MatMul_8843j% locationqwen3_0.6B_fp32.onnx.dataj offset 604213248j length12582912p*mBonnx::MatMul_8844j% locationqwen3_0.6B_fp32.onnx.dataj offset 616796160j length12582912p*lBonnx::MatMul_8845j% locationqwen3_0.6B_fp32.onnx.dataj offset 629379072j length8388608p*lBonnx::MatMul_8846j% locationqwen3_0.6B_fp32.onnx.dataj offset 637767680j length4194304p*lBonnx::MatMul_8847j% locationqwen3_0.6B_fp32.onnx.dataj offset 641961984j length4194304p*lBonnx::MatMul_8869j% locationqwen3_0.6B_fp32.onnx.dataj offset 646156288j length8388608p*mBonnx::MatMul_8870j% locationqwen3_0.6B_fp32.onnx.dataj offset 654544896j length12582912p*mBonnx::MatMul_8871j% locationqwen3_0.6B_fp32.onnx.dataj offset 667127808j length12582912p*mBonnx::MatMul_8872j% locationqwen3_0.6B_fp32.onnx.dataj offset 679710720j length12582912p*lBonnx::MatMul_8873j% locationqwen3_0.6B_fp32.onnx.dataj offset 692293632j length8388608p*lBonnx::MatMul_8874j% locationqwen3_0.6B_fp32.onnx.dataj offset 700682240j length4194304p*lBonnx::MatMul_8875j% locationqwen3_0.6B_fp32.onnx.dataj offset 704876544j length4194304p*lBonnx::MatMul_8897j% locationqwen3_0.6B_fp32.onnx.dataj offset 709070848j length8388608p*mBonnx::MatMul_8898j% locationqwen3_0.6B_fp32.onnx.dataj offset 717459456j length12582912p*mBonnx::MatMul_8899j% locationqwen3_0.6B_fp32.onnx.dataj offset 730042368j length12582912p*mBonnx::MatMul_8900j% locationqwen3_0.6B_fp32.onnx.dataj offset 742625280j length12582912p*lBonnx::MatMul_8901j% locationqwen3_0.6B_fp32.onnx.dataj offset 755208192j length8388608p*lBonnx::MatMul_8902j% locationqwen3_0.6B_fp32.onnx.dataj offset 763596800j length4194304p*lBonnx::MatMul_8903j% locationqwen3_0.6B_fp32.onnx.dataj offset 767791104j length4194304p*lBonnx::MatMul_8925j% locationqwen3_0.6B_fp32.onnx.dataj offset 771985408j length8388608p*mBonnx::MatMul_8926j% locationqwen3_0.6B_fp32.onnx.dataj offset 780374016j length12582912p*mBonnx::MatMul_8927j% locationqwen3_0.6B_fp32.onnx.dataj offset 792956928j length12582912p*mBonnx::MatMul_8928j% locationqwen3_0.6B_fp32.onnx.dataj offset 805539840j length12582912p*lBonnx::MatMul_8929j% locationqwen3_0.6B_fp32.onnx.dataj offset 818122752j length8388608p*lBonnx::MatMul_8930j% locationqwen3_0.6B_fp32.onnx.dataj offset 826511360j length4194304p*lBonnx::MatMul_8931j% locationqwen3_0.6B_fp32.onnx.dataj offset 830705664j length4194304p*lBonnx::MatMul_8953j% locationqwen3_0.6B_fp32.onnx.dataj offset 834899968j length8388608p*mBonnx::MatMul_8954j% locationqwen3_0.6B_fp32.onnx.dataj offset 843288576j length12582912p*mBonnx::MatMul_8955j% locationqwen3_0.6B_fp32.onnx.dataj offset 855871488j length12582912p*mBonnx::MatMul_8956j% locationqwen3_0.6B_fp32.onnx.dataj offset 868454400j length12582912p*lBonnx::MatMul_8957j% locationqwen3_0.6B_fp32.onnx.dataj offset 881037312j length8388608p*lBonnx::MatMul_8958j% locationqwen3_0.6B_fp32.onnx.dataj offset 889425920j length4194304p*lBonnx::MatMul_8959j% locationqwen3_0.6B_fp32.onnx.dataj offset 893620224j length4194304p*lBonnx::MatMul_8981j% locationqwen3_0.6B_fp32.onnx.dataj offset 897814528j length8388608p*mBonnx::MatMul_8982j% locationqwen3_0.6B_fp32.onnx.dataj offset 906203136j length12582912p*mBonnx::MatMul_8983j% locationqwen3_0.6B_fp32.onnx.dataj offset 918786048j length12582912p*mBonnx::MatMul_8984j% locationqwen3_0.6B_fp32.onnx.dataj offset 931368960j length12582912p*lBonnx::MatMul_8985j% locationqwen3_0.6B_fp32.onnx.dataj offset 943951872j length8388608p*lBonnx::MatMul_8986j% locationqwen3_0.6B_fp32.onnx.dataj offset 952340480j length4194304p*lBonnx::MatMul_8987j% locationqwen3_0.6B_fp32.onnx.dataj offset 956534784j length4194304p*lBonnx::MatMul_9009j% locationqwen3_0.6B_fp32.onnx.dataj offset 960729088j length8388608p*mBonnx::MatMul_9010j% locationqwen3_0.6B_fp32.onnx.dataj offset 969117696j length12582912p*mBonnx::MatMul_9011j% locationqwen3_0.6B_fp32.onnx.dataj offset 981700608j length12582912p*mBonnx::MatMul_9012j% locationqwen3_0.6B_fp32.onnx.dataj offset 994283520j length12582912p*mBonnx::MatMul_9013j% locationqwen3_0.6B_fp32.onnx.dataj offset 1006866432j length8388608p*mBonnx::MatMul_9014j% locationqwen3_0.6B_fp32.onnx.dataj offset 1015255040j length4194304p*mBonnx::MatMul_9015j% locationqwen3_0.6B_fp32.onnx.dataj offset 1019449344j length4194304p*mBonnx::MatMul_9037j% locationqwen3_0.6B_fp32.onnx.dataj offset 1023643648j length8388608p*nBonnx::MatMul_9038j% locationqwen3_0.6B_fp32.onnx.dataj offset 1032032256j length12582912p*nBonnx::MatMul_9039j% locationqwen3_0.6B_fp32.onnx.dataj offset 1044615168j length12582912p*nBonnx::MatMul_9040j% locationqwen3_0.6B_fp32.onnx.dataj offset 1057198080j length12582912p*mBonnx::MatMul_9041j% locationqwen3_0.6B_fp32.onnx.dataj offset 1069780992j length8388608p*mBonnx::MatMul_9042j% locationqwen3_0.6B_fp32.onnx.dataj offset 1078169600j length4194304p*mBonnx::MatMul_9043j% locationqwen3_0.6B_fp32.onnx.dataj offset 1082363904j length4194304p*mBonnx::MatMul_9065j% locationqwen3_0.6B_fp32.onnx.dataj offset 1086558208j length8388608p*nBonnx::MatMul_9066j% locationqwen3_0.6B_fp32.onnx.dataj offset 1094946816j length12582912p*nBonnx::MatMul_9067j% locationqwen3_0.6B_fp32.onnx.dataj offset 1107529728j length12582912p*nBonnx::MatMul_9068j% locationqwen3_0.6B_fp32.onnx.dataj offset 1120112640j length12582912p*mBonnx::MatMul_9069j% locationqwen3_0.6B_fp32.onnx.dataj offset 1132695552j length8388608p*mBonnx::MatMul_9070j% locationqwen3_0.6B_fp32.onnx.dataj offset 1141084160j length4194304p*mBonnx::MatMul_9071j% locationqwen3_0.6B_fp32.onnx.dataj offset 1145278464j length4194304p*mBonnx::MatMul_9093j% locationqwen3_0.6B_fp32.onnx.dataj offset 1149472768j length8388608p*nBonnx::MatMul_9094j% locationqwen3_0.6B_fp32.onnx.dataj offset 1157861376j length12582912p*nBonnx::MatMul_9095j% locationqwen3_0.6B_fp32.onnx.dataj offset 1170444288j length12582912p*nBonnx::MatMul_9096j% locationqwen3_0.6B_fp32.onnx.dataj offset 1183027200j length12582912p*mBonnx::MatMul_9097j% locationqwen3_0.6B_fp32.onnx.dataj offset 1195610112j length8388608p*mBonnx::MatMul_9098j% locationqwen3_0.6B_fp32.onnx.dataj offset 1203998720j length4194304p*mBonnx::MatMul_9099j% locationqwen3_0.6B_fp32.onnx.dataj offset 1208193024j length4194304p*mBonnx::MatMul_9121j% locationqwen3_0.6B_fp32.onnx.dataj offset 1212387328j length8388608p*nBonnx::MatMul_9122j% locationqwen3_0.6B_fp32.onnx.dataj offset 1220775936j length12582912p*nBonnx::MatMul_9123j% locationqwen3_0.6B_fp32.onnx.dataj offset 1233358848j length12582912p*nBonnx::MatMul_9124j% locationqwen3_0.6B_fp32.onnx.dataj offset 1245941760j length12582912p*mBonnx::MatMul_9125j% locationqwen3_0.6B_fp32.onnx.dataj offset 1258524672j length8388608p*mBonnx::MatMul_9126j% locationqwen3_0.6B_fp32.onnx.dataj offset 1266913280j length4194304p*mBonnx::MatMul_9127j% locationqwen3_0.6B_fp32.onnx.dataj offset 1271107584j length4194304p*mBonnx::MatMul_9149j% locationqwen3_0.6B_fp32.onnx.dataj offset 1275301888j length8388608p*nBonnx::MatMul_9150j% locationqwen3_0.6B_fp32.onnx.dataj offset 1283690496j length12582912p*nBonnx::MatMul_9151j% locationqwen3_0.6B_fp32.onnx.dataj offset 1296273408j length12582912p*nBonnx::MatMul_9152j% locationqwen3_0.6B_fp32.onnx.dataj offset 1308856320j length12582912p*mBonnx::MatMul_9153j% locationqwen3_0.6B_fp32.onnx.dataj offset 1321439232j length8388608p*mBonnx::MatMul_9154j% locationqwen3_0.6B_fp32.onnx.dataj offset 1329827840j length4194304p*mBonnx::MatMul_9155j% locationqwen3_0.6B_fp32.onnx.dataj offset 1334022144j length4194304p*mBonnx::MatMul_9177j% locationqwen3_0.6B_fp32.onnx.dataj offset 1338216448j length8388608p*nBonnx::MatMul_9178j% locationqwen3_0.6B_fp32.onnx.dataj offset 1346605056j length12582912p*nBonnx::MatMul_9179j% locationqwen3_0.6B_fp32.onnx.dataj offset 1359187968j length12582912p*nBonnx::MatMul_9180j% locationqwen3_0.6B_fp32.onnx.dataj offset 1371770880j length12582912p*mBonnx::MatMul_9181j% locationqwen3_0.6B_fp32.onnx.dataj offset 1384353792j length8388608p*mBonnx::MatMul_9182j% locationqwen3_0.6B_fp32.onnx.dataj offset 1392742400j length4194304p*mBonnx::MatMul_9183j% locationqwen3_0.6B_fp32.onnx.dataj offset 1396936704j length4194304p*mBonnx::MatMul_9205j% locationqwen3_0.6B_fp32.onnx.dataj offset 1401131008j length8388608p*nBonnx::MatMul_9206j% locationqwen3_0.6B_fp32.onnx.dataj offset 1409519616j length12582912p*nBonnx::MatMul_9207j% locationqwen3_0.6B_fp32.onnx.dataj offset 1422102528j length12582912p*nBonnx::MatMul_9208j% locationqwen3_0.6B_fp32.onnx.dataj offset 1434685440j length12582912p*mBonnx::MatMul_9209j% locationqwen3_0.6B_fp32.onnx.dataj offset 1447268352j length8388608p*mBonnx::MatMul_9210j% locationqwen3_0.6B_fp32.onnx.dataj offset 1455656960j length4194304p*mBonnx::MatMul_9211j% locationqwen3_0.6B_fp32.onnx.dataj offset 1459851264j length4194304p*mBonnx::MatMul_9233j% locationqwen3_0.6B_fp32.onnx.dataj offset 1464045568j length8388608p*nBonnx::MatMul_9234j% locationqwen3_0.6B_fp32.onnx.dataj offset 1472434176j length12582912p*nBonnx::MatMul_9235j% locationqwen3_0.6B_fp32.onnx.dataj offset 1485017088j length12582912p*nBonnx::MatMul_9236j% locationqwen3_0.6B_fp32.onnx.dataj offset 1497600000j length12582912p*mBonnx::MatMul_9237j% locationqwen3_0.6B_fp32.onnx.dataj offset 1510182912j length8388608p*mBonnx::MatMul_9238j% locationqwen3_0.6B_fp32.onnx.dataj offset 1518571520j length4194304p*mBonnx::MatMul_9239j% locationqwen3_0.6B_fp32.onnx.dataj offset 1522765824j length4194304p*mBonnx::MatMul_9261j% locationqwen3_0.6B_fp32.onnx.dataj offset 1526960128j length8388608p*nBonnx::MatMul_9262j% locationqwen3_0.6B_fp32.onnx.dataj offset 1535348736j length12582912p*nBonnx::MatMul_9263j% locationqwen3_0.6B_fp32.onnx.dataj offset 1547931648j length12582912p*nBonnx::MatMul_9264j% locationqwen3_0.6B_fp32.onnx.dataj offset 1560514560j length12582912p*mBonnx::MatMul_9265j% locationqwen3_0.6B_fp32.onnx.dataj offset 1573097472j length8388608p*mBonnx::MatMul_9266j% locationqwen3_0.6B_fp32.onnx.dataj offset 1581486080j length4194304p*mBonnx::MatMul_9267j% locationqwen3_0.6B_fp32.onnx.dataj offset 1585680384j length4194304p*mBonnx::MatMul_9289j% locationqwen3_0.6B_fp32.onnx.dataj offset 1589874688j length8388608p*nBonnx::MatMul_9290j% locationqwen3_0.6B_fp32.onnx.dataj offset 1598263296j length12582912p*nBonnx::MatMul_9291j% locationqwen3_0.6B_fp32.onnx.dataj offset 1610846208j length12582912p*nBonnx::MatMul_9292j% locationqwen3_0.6B_fp32.onnx.dataj offset 1623429120j length12582912p*mBonnx::MatMul_9293j% locationqwen3_0.6B_fp32.onnx.dataj offset 1636012032j length8388608p*mBonnx::MatMul_9294j% locationqwen3_0.6B_fp32.onnx.dataj offset 1644400640j length4194304p*mBonnx::MatMul_9295j% locationqwen3_0.6B_fp32.onnx.dataj offset 1648594944j length4194304p*mBonnx::MatMul_9317j% locationqwen3_0.6B_fp32.onnx.dataj offset 1652789248j length8388608p*nBonnx::MatMul_9318j% locationqwen3_0.6B_fp32.onnx.dataj offset 1661177856j length12582912p*nBonnx::MatMul_9319j% locationqwen3_0.6B_fp32.onnx.dataj offset 1673760768j length12582912p*nBonnx::MatMul_9320j% locationqwen3_0.6B_fp32.onnx.dataj offset 1686343680j length12582912p*mBonnx::MatMul_9321j% locationqwen3_0.6B_fp32.onnx.dataj offset 1698926592j length8388608p*mBonnx::MatMul_9322j% locationqwen3_0.6B_fp32.onnx.dataj offset 1707315200j length4194304p*mBonnx::MatMul_9323j% locationqwen3_0.6B_fp32.onnx.dataj offset 1711509504j length4194304p*mBonnx::MatMul_9345j% locationqwen3_0.6B_fp32.onnx.dataj offset 1715703808j length8388608p*nBonnx::MatMul_9346j% locationqwen3_0.6B_fp32.onnx.dataj offset 1724092416j length12582912p*nBonnx::MatMul_9347j% locationqwen3_0.6B_fp32.onnx.dataj offset 1736675328j length12582912p*nBonnx::MatMul_9348j% locationqwen3_0.6B_fp32.onnx.dataj offset 1749258240j length12582912p*p Bonnx::MatMul_9352j% locationqwen3_0.6B_fp32.onnx.dataj offset 1761841152j length 622329856pZ' input_ids  seq_len  Z6 attention_mask$ "   seq_len seq_lenZ% position_ids   seq_lenZ= past_key_values* ($     history_len  bB logits8 62 MatMullogits_dim_0 MatMullogits_dim_1  b] hidden_statesL JF MatMullogits_dim_0 MatMullogits_dim_1 Mulhidden_states_dim_2b? presents3 1-    Concatpresents_dim_3  B